diff --git a/data/fig1.dta b/data/fig1.dta
index c6cf242..0342866 100644
Binary files a/data/fig1.dta and b/data/fig1.dta differ
diff --git a/data/fig2.dta b/data/fig2.dta
index 6e76833..f7af3fe 100644
Binary files a/data/fig2.dta and b/data/fig2.dta differ
diff --git a/data/fig3.dta b/data/fig3.dta
index 40912a9..56bb8fd 100644
Binary files a/data/fig3.dta and b/data/fig3.dta differ
diff --git a/data/nhefs-formatted.dta b/data/nhefs-formatted.dta
index e8df4c0..1e75f95 100644
Binary files a/data/nhefs-formatted.dta and b/data/nhefs-formatted.dta differ
diff --git a/data/nhefs-highprice.dta b/data/nhefs-highprice.dta
index ceae41d..a7ee401 100644
Binary files a/data/nhefs-highprice.dta and b/data/nhefs-highprice.dta differ
diff --git a/data/nhefs-ps.dta b/data/nhefs-ps.dta
index ac5cb05..177494b 100644
Binary files a/data/nhefs-ps.dta and b/data/nhefs-ps.dta differ
diff --git a/data/nhefs-wcens.dta b/data/nhefs-wcens.dta
index e84665a..0723751 100644
Binary files a/data/nhefs-wcens.dta and b/data/nhefs-wcens.dta differ
diff --git a/data/nhefs_std.dta b/data/nhefs_std.dta
index fd0face..5f7968c 100644
Binary files a/data/nhefs_std.dta and b/data/nhefs_std.dta differ
diff --git a/data/nhefs_std1.dta b/data/nhefs_std1.dta
index 8e2c46c..16573d6 100644
Binary files a/data/nhefs_std1.dta and b/data/nhefs_std1.dta differ
diff --git a/data/nhefs_std2.dta b/data/nhefs_std2.dta
index b11c3ad..add5e86 100644
Binary files a/data/nhefs_std2.dta and b/data/nhefs_std2.dta differ
diff --git a/data/nhefs_surv.dta b/data/nhefs_surv.dta
index 1a73c0e..7e61ba3 100644
Binary files a/data/nhefs_surv.dta and b/data/nhefs_surv.dta differ
diff --git a/data/observe.mmat b/data/observe.mmat
index fbe2c0a..d8710e6 100644
Binary files a/data/observe.mmat and b/data/observe.mmat differ
diff --git a/docs/11-why-model-r.md b/docs/11-why-model-r.md
index 1d37fa4..b782354 100644
--- a/docs/11-why-model-r.md
+++ b/docs/11-why-model-r.md
@@ -10,7 +10,7 @@
- Data from Figures 11.1 and 11.2
-```r
+``` r
A <- c(1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0)
Y <- c(200, 150, 220, 110, 50, 180, 90, 170, 170, 30,
70, 110, 80, 50, 10, 20)
@@ -20,13 +20,19 @@ plot(A, Y)
-```r
+``` r
summary(Y[A == 0])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 10.0 27.5 60.0 67.5 87.5 170.0
+```
+
+``` r
summary(Y[A == 1])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 50.0 105.0 160.0 146.2 185.0 220.0
+```
+
+``` r
A2 <- c(1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4)
Y2 <- c(110, 80, 50, 40, 170, 30, 70, 50, 110, 50, 180,
@@ -37,16 +43,25 @@ plot(A2, Y2)
-```r
+``` r
summary(Y2[A2 == 1])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 40.0 47.5 65.0 70.0 87.5 110.0
+```
+
+``` r
summary(Y2[A2 == 2])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 30 45 60 80 95 170
+```
+
+``` r
summary(Y2[A2 == 3])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 50.0 95.0 120.0 117.5 142.5 180.0
+```
+
+``` r
summary(Y2[A2 == 4])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 150.0 187.5 205.0 195.0 212.5 220.0
@@ -59,7 +74,7 @@ summary(Y2[A2 == 4])
- Data from Figures 11.3 and 11.1
-```r
+``` r
A3 <-
c(3, 11, 17, 23, 29, 37, 41, 53, 67, 79, 83, 97, 60, 71, 15, 45)
Y3 <-
@@ -71,7 +86,7 @@ plot(Y3 ~ A3)
-```r
+``` r
summary(glm(Y3 ~ A3))
#>
@@ -92,9 +107,15 @@ summary(glm(Y3 ~ A3))
#> AIC: 170.43
#>
#> Number of Fisher Scoring iterations: 2
+```
+
+``` r
predict(glm(Y3 ~ A3), data.frame(A3 = 90))
#> 1
#> 216.89
+```
+
+``` r
summary(glm(Y ~ A))
#>
@@ -123,7 +144,7 @@ summary(glm(Y ~ A))
- Data from Figure 11.3
-```r
+``` r
Asq <- A3 * A3
mod3 <- glm(Y3 ~ A3 + Asq)
@@ -147,6 +168,9 @@ summary(mod3)
#> AIC: 170.39
#>
#> Number of Fisher Scoring iterations: 2
+```
+
+``` r
predict(mod3, data.frame(cbind(A3 = 90, Asq = 8100)))
#> 1
#> 197.1269
diff --git a/docs/11-why-model-stata.md b/docs/11-why-model-stata.md
index 36601c4..d145dd4 100644
--- a/docs/11-why-model-stata.md
+++ b/docs/11-why-model-stata.md
@@ -3,12 +3,12 @@
# 11. Why model: Stata{-}
-```r
+``` r
library(Statamarkdown)
```
-```stata
+``` stata
do dependency
```
@@ -35,7 +35,7 @@ For errors contact: ejmurray@bu.edu
- Sample averages by treatment level
-```stata
+``` stata
clear
**Figure 11.1**
@@ -112,7 +112,7 @@ bysort A: sum Y
-```stata
+``` stata
*Clear the workspace to be able to use a new dataset*
clear
@@ -200,7 +200,7 @@ bysort A: sum Y
-```stata
+``` stata
clear
**Figure 11.3**
@@ -258,7 +258,7 @@ qui gr export figs/stata-fig-11-3.png, replace
- Creates Figure 11.4, parameter estimates with 95% confidence intervals from Section 11.2, and parameter estimates with 95% confidence intervals from Section 11.3
-```stata
+``` stata
**Section 11.2: parametric estimators**
*Reload data
use ./data/fig3, clear
@@ -297,7 +297,7 @@ qui gr export figs/stata-fig-11-4.png, replace
-```stata
+``` stata
**Section 11.3: non-parametric estimation*
* Reload the data
use ./data/fig1, clear
@@ -325,7 +325,7 @@ di 67.50 + 78.75
- Creates Figure 11.5 and Parameter estimates for Section 11.4
-```stata
+``` stata
* Reload the data
use ./data/fig3, clear
diff --git a/docs/12-ipw-msm-r.md b/docs/12-ipw-msm-r.md
index 9ecaa29..3601571 100644
--- a/docs/12-ipw-msm-r.md
+++ b/docs/12-ipw-msm-r.md
@@ -7,12 +7,12 @@
- Descriptive statistics from NHEFS data (Table 12.1)
-```r
+``` r
library(here)
```
-```r
+``` r
# install.packages("readxl") # install package if required
library("readxl")
@@ -31,91 +31,151 @@ lm(wt82_71 ~ qsmk, data = nhefs.nmv)
#> Coefficients:
#> (Intercept) qsmk
#> 1.984 2.541
+```
+
+``` r
# Smoking cessation
predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 1))
#> 1
#> 4.525079
+```
+
+``` r
# No smoking cessation
predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 0))
#> 1
#> 1.984498
+```
+
+``` r
# Table
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$age)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 25.00 33.00 42.00 42.79 51.00 72.00
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$wt71)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 40.82 59.19 68.49 70.30 79.38 151.73
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeintensity)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 1.00 15.00 20.00 21.19 30.00 60.00
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeyrs)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 1.00 15.00 23.00 24.09 32.00 64.00
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$age)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 25.00 35.00 46.00 46.17 56.00 74.00
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$wt71)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 39.58 60.67 71.21 72.35 81.08 136.98
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeintensity)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 1.0 10.0 20.0 18.6 25.0 80.0
+```
+
+``` r
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeyrs)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 1.00 15.00 26.00 26.03 35.00 60.00
+```
+
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$sex)
#>
#> 0 1
#> 0 542 621
#> 1 220 183
+```
+
+``` r
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$sex), 1)
#>
#> 0 1
#> 0 0.4660361 0.5339639
#> 1 0.5459057 0.4540943
+```
+
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$race)
#>
#> 0 1
#> 0 993 170
#> 1 367 36
+```
+
+``` r
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$race), 1)
#>
#> 0 1
#> 0 0.85382631 0.14617369
#> 1 0.91066998 0.08933002
+```
+
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$education)
#>
#> 1 2 3 4 5
#> 0 210 266 480 92 115
#> 1 81 74 157 29 62
+```
+
+``` r
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$education), 1)
#>
#> 1 2 3 4 5
#> 0 0.18056750 0.22871883 0.41272571 0.07910576 0.09888220
#> 1 0.20099256 0.18362283 0.38957816 0.07196030 0.15384615
+```
+
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$exercise)
#>
#> 0 1 2
#> 0 237 485 441
#> 1 63 176 164
+```
+
+``` r
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$exercise), 1)
#>
#> 0 1 2
#> 0 0.2037833 0.4170249 0.3791917
#> 1 0.1563275 0.4367246 0.4069479
+```
+
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$active)
#>
#> 0 1 2
#> 0 532 527 104
#> 1 170 188 45
+```
+
+``` r
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$active), 1)
#>
#> 0 1 2
@@ -130,7 +190,7 @@ prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$active), 1)
- Data from NHEFS
-```r
+``` r
# Estimation of ip weights via a logistic model
fit <- glm(
qsmk ~ sex + race + age + I(age ^ 2) +
@@ -179,6 +239,9 @@ summary(fit)
#> AIC: 1714.9
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
p.qsmk.obs <-
ifelse(nhefs.nmv$qsmk == 0,
@@ -189,8 +252,14 @@ nhefs.nmv$w <- 1 / p.qsmk.obs
summary(nhefs.nmv$w)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 1.054 1.230 1.373 1.996 1.990 16.700
+```
+
+``` r
sd(nhefs.nmv$w)
#> [1] 1.474787
+```
+
+``` r
# install.packages("geepack") # install package if required
library("geepack")
@@ -220,6 +289,9 @@ summary(msm.w)
#> Estimate Std.err
#> (Intercept) 65.06 4.221
#> Number of clusters: 1566 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.w)
SE <- coef(summary(msm.w))[, 2]
@@ -229,6 +301,9 @@ cbind(beta, lcl, ucl)
#> beta lcl ucl
#> (Intercept) 1.780 1.340 2.22
#> qsmk 3.441 2.411 4.47
+```
+
+``` r
# no association between sex and qsmk in pseudo-population
xtabs(nhefs.nmv$w ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
@@ -236,6 +311,9 @@ xtabs(nhefs.nmv$w ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
#> nhefs.nmv$sex 0 1
#> 0 763.6 763.6
#> 1 801.7 797.2
+```
+
+``` r
# "check" for positivity (White women)
table(nhefs.nmv$age[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1],
@@ -298,7 +376,7 @@ table(nhefs.nmv$age[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1],
- Data from NHEFS
-```r
+``` r
# estimation of denominator of ip weights
denom.fit <-
glm(
@@ -348,6 +426,9 @@ summary(denom.fit)
#> AIC: 1715
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pd.qsmk <- predict(denom.fit, type = "response")
@@ -371,6 +452,9 @@ summary(numer.fit)
#> AIC: 1788
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pn.qsmk <- predict(numer.fit, type = "response")
@@ -381,6 +465,9 @@ nhefs.nmv$sw <-
summary(nhefs.nmv$sw)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.331 0.867 0.950 0.999 1.079 4.298
+```
+
+``` r
msm.sw <- geeglm(
@@ -409,6 +496,9 @@ summary(msm.sw)
#> Estimate Std.err
#> (Intercept) 60.7 3.71
#> Number of clusters: 1566 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.sw)
SE <- coef(summary(msm.sw))[, 2]
@@ -418,6 +508,9 @@ cbind(beta, lcl, ucl)
#> beta lcl ucl
#> (Intercept) 1.78 1.34 2.22
#> qsmk 3.44 2.41 4.47
+```
+
+``` r
# no association between sex and qsmk in pseudo-population
xtabs(nhefs.nmv$sw ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
@@ -432,7 +525,7 @@ xtabs(nhefs.nmv$sw ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
- Estimating the parameters of a marginal structural mean model with a continuous treatment Data from NHEFS
-```r
+``` r
# Analysis restricted to subjects reporting <=25 cig/day at baseline
nhefs.nmv.s <- subset(nhefs.nmv, smokeintensity <= 25)
@@ -463,6 +556,9 @@ nhefs.nmv.s$sw.a <- dens.num / dens.den
summary(nhefs.nmv.s$sw.a)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.19 0.89 0.97 1.00 1.05 5.10
+```
+
+``` r
msm.sw.cont <-
geeglm(
@@ -493,6 +589,9 @@ summary(msm.sw.cont)
#> Estimate Std.err
#> (Intercept) 60.5 4.5
#> Number of clusters: 1162 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.sw.cont)
SE <- coef(summary(msm.sw.cont))[, 2]
@@ -511,12 +610,15 @@ cbind(beta, lcl, ucl)
- Data from NHEFS
-```r
+``` r
table(nhefs.nmv$qsmk, nhefs.nmv$death)
#>
#> 0 1
#> 0 963 200
#> 1 312 91
+```
+
+``` r
# First, estimation of stabilized weights sw (same as in Program 12.3)
# Second, fit logistic model below
@@ -529,6 +631,9 @@ msm.logistic <- geeglm(
corstr = "independence"
)
#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+```
+
+``` r
summary(msm.logistic)
#>
#> Call:
@@ -548,6 +653,9 @@ summary(msm.logistic)
#> Estimate Std.err
#> (Intercept) 1 0.0678
#> Number of clusters: 1566 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.logistic)
SE <- coef(summary(msm.logistic))[, 2]
@@ -565,11 +673,14 @@ cbind(beta, lcl, ucl)
- Data from NHEFS
-```r
+``` r
table(nhefs.nmv$sex)
#>
#> 0 1
#> 762 804
+```
+
+``` r
# estimation of denominator of ip weights
denom.fit <-
@@ -620,6 +731,9 @@ summary(denom.fit)
#> AIC: 1715
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pd.qsmk <- predict(denom.fit, type = "response")
@@ -645,6 +759,9 @@ summary(numer.fit)
#> AIC: 1782
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pn.qsmk <- predict(numer.fit, type = "response")
nhefs.nmv$sw.a <-
@@ -654,8 +771,14 @@ nhefs.nmv$sw.a <-
summary(nhefs.nmv$sw.a)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.29 0.88 0.96 1.00 1.08 3.80
+```
+
+``` r
sd(nhefs.nmv$sw.a)
#> [1] 0.271
+```
+
+``` r
# Estimating parameters of a marginal structural mean model
msm.emm <- geeglm(
@@ -688,6 +811,9 @@ summary(msm.emm)
#> Estimate Std.err
#> (Intercept) 60.8 3.71
#> Number of clusters: 1566 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.emm)
SE <- coef(summary(msm.emm))[, 2]
@@ -707,19 +833,28 @@ cbind(beta, lcl, ucl)
- Data from NHEFS
-```r
+``` r
table(nhefs$qsmk, nhefs$cens)
#>
#> 0 1
#> 0 1163 38
#> 1 403 25
+```
+
+``` r
summary(nhefs[which(nhefs$cens == 0),]$wt71)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 39.6 59.5 69.2 70.8 79.8 151.7
+```
+
+``` r
summary(nhefs[which(nhefs$cens == 1),]$wt71)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 36.2 63.1 72.1 76.6 87.9 169.2
+```
+
+``` r
# estimation of denominator of ip weights for A
denom.fit <-
@@ -770,6 +905,9 @@ summary(denom.fit)
#> AIC: 1805
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pd.qsmk <- predict(denom.fit, type = "response")
@@ -793,6 +931,9 @@ summary(numer.fit)
#> AIC: 1878
#>
#> Number of Fisher Scoring iterations: 4
+```
+
+``` r
pn.qsmk <- predict(numer.fit, type = "response")
# estimation of denominator of ip weights for C
@@ -846,6 +987,9 @@ summary(denom.cens)
#> AIC: 505.4
#>
#> Number of Fisher Scoring iterations: 7
+```
+
+``` r
pd.cens <- 1 - predict(denom.cens, type = "response")
@@ -871,6 +1015,9 @@ summary(numer.cens)
#> AIC: 531.8
#>
#> Number of Fisher Scoring iterations: 6
+```
+
+``` r
pn.cens <- 1 - predict(numer.cens, type = "response")
nhefs$sw.a <-
@@ -882,18 +1029,36 @@ nhefs$sw <- nhefs$sw.c * nhefs$sw.a
summary(nhefs$sw.a)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.33 0.86 0.95 1.00 1.08 4.21
+```
+
+``` r
sd(nhefs$sw.a)
#> [1] 0.284
+```
+
+``` r
summary(nhefs$sw.c)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.94 0.98 0.99 1.01 1.01 7.58
+```
+
+``` r
sd(nhefs$sw.c)
#> [1] 0.178
+```
+
+``` r
summary(nhefs$sw)
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
#> 0.35 0.86 0.94 1.01 1.08 12.86
+```
+
+``` r
sd(nhefs$sw)
#> [1] 0.411
+```
+
+``` r
msm.sw <- geeglm(
wt82_71 ~ qsmk,
@@ -921,6 +1086,9 @@ summary(msm.sw)
#> Estimate Std.err
#> (Intercept) 61.8 3.83
#> Number of clusters: 1566 Maximum cluster size: 1
+```
+
+``` r
beta <- coef(msm.sw)
SE <- coef(summary(msm.sw))[, 2]
diff --git a/docs/12-ipw-msm-stata.md b/docs/12-ipw-msm-stata.md
index 3938d12..ff8a539 100644
--- a/docs/12-ipw-msm-stata.md
+++ b/docs/12-ipw-msm-stata.md
@@ -1,7 +1,7 @@
# 12. IP Weighting and Marginal Structural Models: Stata{-}
-```r
+``` r
library(Statamarkdown)
```
@@ -19,7 +19,7 @@ For errors contact: ejmurray@bu.edu
- Descriptive statistics from NHEFS data (Table 12.1)
-```stata
+``` stata
use ./data/nhefs, clear
/*Provisionally ignore subjects with missing values for follow-up weight*/
@@ -56,7 +56,7 @@ qui save ./data/nhefs-formatted, replace
-```stata
+``` stata
use ./data/nhefs-formatted, clear
/*Output table*/
@@ -148,7 +148,7 @@ No smoking cessation | 8.9
- Data from NHEFS
-```stata
+``` stata
use ./data/nhefs-formatted, clear
/*Fit a logistic model for the IP weights*/
@@ -259,7 +259,7 @@ Linear regression Number of obs = 1,566
- Data from NHEFS
-```stata
+``` stata
use ./data/nhefs-formatted, clear
/*Fit a logistic model for the denominator of the IP weights and predict the */
@@ -495,7 +495,7 @@ Linear regression Number of obs = 1,566
- Section 12.4
-```stata
+``` stata
use ./data/nhefs-formatted, clear
* drop sw_a
@@ -642,7 +642,7 @@ c.smkintensity82_71 | .0026949 .0024203 1.11 0.266 -.0020537 .00
- Section 12.4
-```stata
+``` stata
use ./data/nhefs, clear
/*Provisionally ignore subjects with missing values for follow-up weight*/
@@ -778,7 +778,7 @@ Note: _cons estimates baseline odds.
- Section 12.5
-```stata
+``` stata
use ./data/nhefs, clear
* drop pd_qsmk pn_qsmk sw_a
@@ -927,7 +927,7 @@ Linear regression Number of obs = 1,566
- Section 12.6
-```stata
+``` stata
use ./data/nhefs, clear
/*Analysis including all individuals regardless of missing wt82 status: N=1629*/
diff --git a/docs/13-stand-gformula-r.md b/docs/13-stand-gformula-r.md
index f36d806..f9446c9 100644
--- a/docs/13-stand-gformula-r.md
+++ b/docs/13-stand-gformula-r.md
@@ -8,12 +8,12 @@
- Data from NHEFS
-```r
+``` r
library(here)
```
-```r
+``` r
# install.packages("readxl") # install package if required
library("readxl")
nhefs <- read_excel(here("data", "NHEFS.xls"))
@@ -72,6 +72,9 @@ summary(fit)
#> AIC: 10701
#>
#> Number of Fisher Scoring iterations: 2
+```
+
+``` r
nhefs$predicted.meanY <- predict(fit, nhefs)
nhefs[which(nhefs$seqn == 24770), c(
@@ -92,10 +95,16 @@ nhefs[which(nhefs$seqn == 24770), c(
#> 25 April 2024 16 June 2024 A more flexible and elegant way to do this is to write a function to perform the model fitting, prediction, bootstrapping, and reporting all at once. For reproducibility. For reproducibility.
17. Causal survival analysis: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -324,21 +324,21 @@
Program 17.1Data from NHEFS
use ./data/nhefs-formatted, clear
-
-/*Some preprocessing of the data*/
-gen survtime = .
-replace survtime = 120 if death == 0
-replace survtime = (yrdth - 83)*12 + modth if death ==1
-* yrdth ranges from 83 to 92*
-
-tab death qsmk
-
-/*Kaplan-Meier graph of observed survival over time, by quitting smoking*/
-*For now, we use the stset function in Stata*
-stset survtime, failure(death=1)
-sts graph, by(qsmk) xlabel(0(12)120)
-qui gr export ./figs/stata-fig-17-1.png, replace
use ./data/nhefs-formatted, clear
+
+/*Some preprocessing of the data*/
+gen survtime = .
+replace survtime = 120 if death == 0
+replace survtime = (yrdth - 83)*12 + modth if death ==1
+* yrdth ranges from 83 to 92*
+
+tab death qsmk
+
+/*Kaplan-Meier graph of observed survival over time, by quitting smoking*/
+*For now, we use the stset function in Stata*
+stset survtime, failure(death=1)
+sts graph, by(qsmk) xlabel(0(12)120)
+qui gr export ./figs/stata-fig-17-1.png, replace
(1,566 missing values generated)
(1,275 real changes made)
@@ -385,92 +385,92 @@
Program 17.2Section 17.1
/**Create person-month dataset for survival analyses**/
-
-/* We want our new dataset to include 1 observation per person
-per month alive, starting at time = 0.
-Individuals who survive to the end of follow-up will have
-119 time points
-Individuals who die will have survtime - 1 time points*/
-
-use ./data/nhefs-formatted, clear
-
-gen survtime = .
-replace survtime = 120 if death == 0
-replace survtime = (yrdth - 83)*12 + modth if death ==1
-
-*expand data to person-time*
-gen time = 0
-expand survtime if time == 0
-bysort seqn: replace time = _n - 1
-
-*Create event variable*
-gen event = 0
-replace event = 1 if time == survtime - 1 & death == 1
-tab event
-
-*Create time-squared variable for analyses*
-gen timesq = time*time
-
-*Save the dataset to your working directory for future use*
-qui save ./data/nhefs_surv, replace
-
-/**Hazard ratios**/
-use ./data/nhefs_surv, clear
-
-*Fit a pooled logistic hazards model *
-logistic event qsmk qsmk#c.time qsmk#c.time#c.time ///
- c.time c.time#c.time
-
-/**Survival curves: run regression then do:**/
-
-*Create a dataset with all time points under each treatment level*
-*Re-expand data with rows for all timepoints*
-drop if time != 0
-expand 120 if time ==0
-bysort seqn: replace time = _n - 1
-
-/*Create 2 copies of each subject, and set outcome to missing
-and treatment -- use only the newobs*/
-expand 2 , generate(interv)
-replace qsmk = interv
-
-/*Generate predicted event and survival probabilities
-for each person each month in copies*/
-predict pevent_k, pr
-gen psurv_k = 1-pevent_k
-keep seqn time qsmk interv psurv_k
-
-*Within copies, generate predicted survival over time*
-*Remember, survival is the product of conditional survival probabilities in each interval*
-sort seqn interv time
-gen _t = time + 1
-gen psurv = psurv_k if _t ==1
-bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
-
-*Display 10-year standardized survival, under interventions*
-*Note: since time starts at 0, month 119 is 10-year survival*
-by interv, sort: summarize psurv if time == 119
-
-*Graph of standardized survival over time, under interventions*
-/*Note, we want our graph to start at 100% survival,
-so add an extra time point with P(surv) = 1*/
-expand 2 if time ==0, generate(newtime)
-replace psurv = 1 if newtime == 1
-gen time2 = 0 if newtime ==1
-replace time2 = time + 1 if newtime == 0
-
-/*Separate the survival probabilities to allow plotting by
-intervention on qsmk*/
-separate psurv, by(interv)
-
-*Plot the curves*
-twoway (line psurv0 time2, sort) ///
- (line psurv1 time2, sort) if interv > -1 ///
- , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
- ytitle("Survival probability") xtitle("Months of follow-up") ///
- legend(label(1 "A=0") label(2 "A=1"))
-qui gr export ./figs/stata-fig-17-2.png, replace
/**Create person-month dataset for survival analyses**/
+
+/* We want our new dataset to include 1 observation per person
+per month alive, starting at time = 0.
+Individuals who survive to the end of follow-up will have
+119 time points
+Individuals who die will have survtime - 1 time points*/
+
+use ./data/nhefs-formatted, clear
+
+gen survtime = .
+replace survtime = 120 if death == 0
+replace survtime = (yrdth - 83)*12 + modth if death ==1
+
+*expand data to person-time*
+gen time = 0
+expand survtime if time == 0
+bysort seqn: replace time = _n - 1
+
+*Create event variable*
+gen event = 0
+replace event = 1 if time == survtime - 1 & death == 1
+tab event
+
+*Create time-squared variable for analyses*
+gen timesq = time*time
+
+*Save the dataset to your working directory for future use*
+qui save ./data/nhefs_surv, replace
+
+/**Hazard ratios**/
+use ./data/nhefs_surv, clear
+
+*Fit a pooled logistic hazards model *
+logistic event qsmk qsmk#c.time qsmk#c.time#c.time ///
+ c.time c.time#c.time
+
+/**Survival curves: run regression then do:**/
+
+*Create a dataset with all time points under each treatment level*
+*Re-expand data with rows for all timepoints*
+drop if time != 0
+expand 120 if time ==0
+bysort seqn: replace time = _n - 1
+
+/*Create 2 copies of each subject, and set outcome to missing
+and treatment -- use only the newobs*/
+expand 2 , generate(interv)
+replace qsmk = interv
+
+/*Generate predicted event and survival probabilities
+for each person each month in copies*/
+predict pevent_k, pr
+gen psurv_k = 1-pevent_k
+keep seqn time qsmk interv psurv_k
+
+*Within copies, generate predicted survival over time*
+*Remember, survival is the product of conditional survival probabilities in each interval*
+sort seqn interv time
+gen _t = time + 1
+gen psurv = psurv_k if _t ==1
+bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
+
+*Display 10-year standardized survival, under interventions*
+*Note: since time starts at 0, month 119 is 10-year survival*
+by interv, sort: summarize psurv if time == 119
+
+*Graph of standardized survival over time, under interventions*
+/*Note, we want our graph to start at 100% survival,
+so add an extra time point with P(surv) = 1*/
+expand 2 if time ==0, generate(newtime)
+replace psurv = 1 if newtime == 1
+gen time2 = 0 if newtime ==1
+replace time2 = time + 1 if newtime == 0
+
+/*Separate the survival probabilities to allow plotting by
+intervention on qsmk*/
+separate psurv, by(interv)
+
+*Plot the curves*
+twoway (line psurv0 time2, sort) ///
+ (line psurv1 time2, sort) if interv > -1 ///
+ , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
+ ytitle("Survival probability") xtitle("Months of follow-up") ///
+ legend(label(1 "A=0") label(2 "A=1"))
+qui gr export ./figs/stata-fig-17-2.png, replace
(1,566 missing values generated)
(1,275 real changes made)
@@ -579,148 +579,148 @@
Program 17.3Section 17.4
use ./data/nhefs_surv, clear
-
-keep seqn event qsmk time sex race age education ///
- smokeintensity smkintensity82_71 smokeyrs ///
- exercise active wt71
-preserve
-
-*Estimate weights*
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ///
- ib(last).active c.wt71##c.wt71 if time == 0
-predict p_qsmk, pr
-
-logit qsmk if time ==0
-predict num, pr
-gen sw=num/p_qsmk if qsmk==1
-replace sw=(1-num)/(1-p_qsmk) if qsmk==0
-summarize sw
-
-*IP weighted survival by smoking cessation*
-logit event qsmk qsmk#c.time qsmk#c.time#c.time ///
- c.time c.time#c.time [pweight=sw] , cluster(seqn)
-
-*Create a dataset with all time points under each treatment level*
-*Re-expand data with rows for all timepoints*
-drop if time != 0
-expand 120 if time ==0
-bysort seqn: replace time = _n - 1
-
-/*Create 2 copies of each subject, and set outcome
-to missing and treatment -- use only the newobs*/
-expand 2 , generate(interv)
-replace qsmk = interv
-
-/*Generate predicted event and survival probabilities
-for each person each month in copies*/
-predict pevent_k, pr
-gen psurv_k = 1-pevent_k
-keep seqn time qsmk interv psurv_k
-
-*Within copies, generate predicted survival over time*
-/*Remember, survival is the product of conditional survival
-probabilities in each interval*/
-sort seqn interv time
-gen _t = time + 1
-gen psurv = psurv_k if _t ==1
-bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
-
-*Display 10-year standardized survival, under interventions*
-*Note: since time starts at 0, month 119 is 10-year survival*
-by interv, sort: summarize psurv if time == 119
-
-quietly summarize psurv if(interv==0 & time ==119)
-matrix input observe = (0,`r(mean)')
-quietly summarize psurv if(interv==1 & time ==119)
-matrix observe = (observe \1,`r(mean)')
-matrix observe = (observe \3, observe[2,2]-observe[1,2])
-matrix list observe
-
-*Graph of standardized survival over time, under interventions*
-/*Note: since our outcome model has no covariates,
-we can plot psurv directly.
-If we had covariates we would need to stratify or average across the values*/
-expand 2 if time ==0, generate(newtime)
-replace psurv = 1 if newtime == 1
-gen time2 = 0 if newtime ==1
-replace time2 = time + 1 if newtime == 0
-separate psurv, by(interv)
-twoway (line psurv0 time2, sort) ///
- (line psurv1 time2, sort) if interv > -1 ///
- , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
- ytitle("Survival probability") xtitle("Months of follow-up") ///
- legend(label(1 "A=0") label(2 "A=1"))
-qui gr export ./figs/stata-fig-17-3.png, replace
-
-*remove extra timepoint*
-drop if newtime == 1
-drop time2
-
-restore
-
-**Bootstraps**
-qui save ./data/nhefs_std1 , replace
-
-capture program drop bootipw_surv
-
-program define bootipw_surv , rclass
-use ./data/nhefs_std1 , clear
-preserve
-bsample, cluster(seqn) idcluster(newseqn)
-
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71 if time == 0
-predict p_qsmk, pr
-
-logit qsmk if time ==0
-predict num, pr
-
-gen sw=num/p_qsmk if qsmk==1
-replace sw=(1-num)/(1-p_qsmk) if qsmk==0
-
-logit event qsmk qsmk#c.time qsmk#c.time#c.time ///
- c.time c.time#c.time [pweight=sw], cluster(newseqn)
-
-drop if time != 0
-expand 120 if time ==0
-bysort newseqn: replace time = _n - 1
-expand 2 , generate(interv_b)
-replace qsmk = interv_b
-
-predict pevent_k, pr
-gen psurv_k = 1-pevent_k
-keep newseqn time qsmk interv_b psurv_k
-
-sort newseqn interv_b time
-gen _t = time + 1
-gen psurv = psurv_k if _t ==1
-bysort newseqn interv_b: ///
- replace psurv = psurv_k*psurv[_t-1] if _t >1
-drop if time != 119
-bysort interv_b: egen meanS_b = mean(psurv)
-keep newseqn qsmk meanS_b
-drop if newseqn != 1 /* only need one pair */
-
-drop newseqn
-
-return scalar boot_0 = meanS_b[1]
-return scalar boot_1 = meanS_b[2]
-return scalar boot_diff = return(boot_1) - return(boot_0)
-restore
-end
-
-set rmsg on
-simulate PrY_a0 = r(boot_0) PrY_a1 = r(boot_1) ///
- difference=r(boot_diff), reps(10) seed(1): bootipw_surv
-set rmsg off
-
-matrix pe = observe[1..3, 2]'
-bstat, stat(pe) n(1629)
use ./data/nhefs_surv, clear
+
+keep seqn event qsmk time sex race age education ///
+ smokeintensity smkintensity82_71 smokeyrs ///
+ exercise active wt71
+preserve
+
+*Estimate weights*
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ///
+ ib(last).active c.wt71##c.wt71 if time == 0
+predict p_qsmk, pr
+
+logit qsmk if time ==0
+predict num, pr
+gen sw=num/p_qsmk if qsmk==1
+replace sw=(1-num)/(1-p_qsmk) if qsmk==0
+summarize sw
+
+*IP weighted survival by smoking cessation*
+logit event qsmk qsmk#c.time qsmk#c.time#c.time ///
+ c.time c.time#c.time [pweight=sw] , cluster(seqn)
+
+*Create a dataset with all time points under each treatment level*
+*Re-expand data with rows for all timepoints*
+drop if time != 0
+expand 120 if time ==0
+bysort seqn: replace time = _n - 1
+
+/*Create 2 copies of each subject, and set outcome
+to missing and treatment -- use only the newobs*/
+expand 2 , generate(interv)
+replace qsmk = interv
+
+/*Generate predicted event and survival probabilities
+for each person each month in copies*/
+predict pevent_k, pr
+gen psurv_k = 1-pevent_k
+keep seqn time qsmk interv psurv_k
+
+*Within copies, generate predicted survival over time*
+/*Remember, survival is the product of conditional survival
+probabilities in each interval*/
+sort seqn interv time
+gen _t = time + 1
+gen psurv = psurv_k if _t ==1
+bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
+
+*Display 10-year standardized survival, under interventions*
+*Note: since time starts at 0, month 119 is 10-year survival*
+by interv, sort: summarize psurv if time == 119
+
+quietly summarize psurv if(interv==0 & time ==119)
+matrix input observe = (0,`r(mean)')
+quietly summarize psurv if(interv==1 & time ==119)
+matrix observe = (observe \1,`r(mean)')
+matrix observe = (observe \3, observe[2,2]-observe[1,2])
+matrix list observe
+
+*Graph of standardized survival over time, under interventions*
+/*Note: since our outcome model has no covariates,
+we can plot psurv directly.
+If we had covariates we would need to stratify or average across the values*/
+expand 2 if time ==0, generate(newtime)
+replace psurv = 1 if newtime == 1
+gen time2 = 0 if newtime ==1
+replace time2 = time + 1 if newtime == 0
+separate psurv, by(interv)
+twoway (line psurv0 time2, sort) ///
+ (line psurv1 time2, sort) if interv > -1 ///
+ , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
+ ytitle("Survival probability") xtitle("Months of follow-up") ///
+ legend(label(1 "A=0") label(2 "A=1"))
+qui gr export ./figs/stata-fig-17-3.png, replace
+
+*remove extra timepoint*
+drop if newtime == 1
+drop time2
+
+restore
+
+**Bootstraps**
+qui save ./data/nhefs_std1 , replace
+
+capture program drop bootipw_surv
+
+program define bootipw_surv , rclass
+use ./data/nhefs_std1 , clear
+preserve
+bsample, cluster(seqn) idcluster(newseqn)
+
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71 if time == 0
+predict p_qsmk, pr
+
+logit qsmk if time ==0
+predict num, pr
+
+gen sw=num/p_qsmk if qsmk==1
+replace sw=(1-num)/(1-p_qsmk) if qsmk==0
+
+logit event qsmk qsmk#c.time qsmk#c.time#c.time ///
+ c.time c.time#c.time [pweight=sw], cluster(newseqn)
+
+drop if time != 0
+expand 120 if time ==0
+bysort newseqn: replace time = _n - 1
+expand 2 , generate(interv_b)
+replace qsmk = interv_b
+
+predict pevent_k, pr
+gen psurv_k = 1-pevent_k
+keep newseqn time qsmk interv_b psurv_k
+
+sort newseqn interv_b time
+gen _t = time + 1
+gen psurv = psurv_k if _t ==1
+bysort newseqn interv_b: ///
+ replace psurv = psurv_k*psurv[_t-1] if _t >1
+drop if time != 119
+bysort interv_b: egen meanS_b = mean(psurv)
+keep newseqn qsmk meanS_b
+drop if newseqn != 1 /* only need one pair */
+
+drop newseqn
+
+return scalar boot_0 = meanS_b[1]
+return scalar boot_1 = meanS_b[2]
+return scalar boot_diff = return(boot_1) - return(boot_0)
+restore
+end
+
+set rmsg on
+simulate PrY_a0 = r(boot_0) PrY_a1 = r(boot_1) ///
+ difference=r(boot_diff), reps(10) seed(1): bootipw_surv
+set rmsg off
+
+matrix pe = observe[1..3, 2]'
+bstat, stat(pe) n(1629)
Iteration 0: Log likelihood = -893.02712
Iteration 1: Log likelihood = -839.70016
Iteration 2: Log likelihood = -838.45045
@@ -907,7 +907,7 @@
Program 17.3Program 17.3Program 17.4Section 17.5
use ./data/nhefs_surv, clear
-
-keep seqn event qsmk time sex race age education ///
- smokeintensity smkintensity82_71 smokeyrs exercise ///
- active wt71
-preserve
-
-quietly logistic event qsmk qsmk#c.time ///
- qsmk#c.time#c.time time c.time#c.time ///
- sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71 , cluster(seqn)
-
-drop if time != 0
-expand 120 if time ==0
-bysort seqn: replace time = _n - 1
-expand 2 , generate(interv)
-replace qsmk = interv
-predict pevent_k, pr
-gen psurv_k = 1-pevent_k
-keep seqn time qsmk interv psurv_k
-sort seqn interv time
-gen _t = time + 1
-gen psurv = psurv_k if _t ==1
-bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
-by interv, sort: summarize psurv if time == 119
-
-keep qsmk interv psurv time
-
-bysort interv : egen meanS = mean(psurv) if time == 119
-by interv: summarize meanS
-
-quietly summarize meanS if(qsmk==0 & time ==119)
-matrix input observe = ( 0,`r(mean)')
-quietly summarize meanS if(qsmk==1 & time ==119)
-matrix observe = (observe \1,`r(mean)')
-matrix observe = (observe \2, observe[2,2]-observe[1,2])
-*Add some row/column descriptions and print results to screen*
-matrix rownames observe = P(Y(a=0)=1) P(Y(a=1)=1) difference
-matrix colnames observe = interv survival
-
-*Graph standardized survival over time, under interventions*
-/*Note: unlike in Program 17.3, we now have covariates
-so we first need to average survival across strata*/
-bysort interv time : egen meanS_t = mean(psurv)
-
-*Now we can continue with the graph*
-expand 2 if time ==0, generate(newtime)
-replace meanS_t = 1 if newtime == 1
-gen time2 = 0 if newtime ==1
-replace time2 = time + 1 if newtime == 0
-separate meanS_t, by(interv)
-
-twoway (line meanS_t0 time2, sort) ///
- (line meanS_t1 time2, sort) ///
- , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
- ytitle("Survival probability") xtitle("Months of follow-up") ///
- legend(label(1 "A=0") label(2 "A=1"))
-gr export ./figs/stata-fig-17-4.png, replace
-
-*remove extra timepoint*
-drop if newtime == 1
-
-restore
-
-*Bootstraps*
-qui save ./data/nhefs_std2 , replace
-
-capture program drop bootstdz_surv
-
-program define bootstdz_surv , rclass
-use ./data/nhefs_std2 , clear
-preserve
-
-bsample, cluster(seqn) idcluster(newseqn)
-logistic event qsmk qsmk#c.time qsmk#c.time#c.time ///
- time c.time#c.time ///
- sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smkintensity82_71 ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71
-drop if time != 0
-/*only predict on new version of data */
-expand 120 if time ==0
-bysort newseqn: replace time = _n - 1
-expand 2 , generate(interv_b)
-replace qsmk = interv_b
-predict pevent_k, pr
-gen psurv_k = 1-pevent_k
-keep newseqn time qsmk psurv_k
-sort newseqn qsmk time
-gen _t = time + 1
-gen psurv = psurv_k if _t ==1
-bysort newseqn qsmk: replace psurv = psurv_k*psurv[_t-1] if _t >1
-drop if time != 119 /* keep only last observation */
-keep newseqn qsmk psurv
-/* if time is in data for complete graph add time to bysort */
-bysort qsmk : egen meanS_b = mean(psurv)
-keep newseqn qsmk meanS_b
-drop if newseqn != 1 /* only need one pair */
-drop newseqn
-
-return scalar boot_0 = meanS_b[1]
-return scalar boot_1 = meanS_b[2]
-return scalar boot_diff = return(boot_1) - return(boot_0)
-restore
-end
-
-set rmsg on
-simulate PrY_a0 = r(boot_0) PrY_a1 = r(boot_1) ///
- difference=r(boot_diff), reps(10) seed(1): bootstdz_surv
-set rmsg off
-
-matrix pe = observe[1..3, 2]'
-bstat, stat(pe) n(1629)
use ./data/nhefs_surv, clear
+
+keep seqn event qsmk time sex race age education ///
+ smokeintensity smkintensity82_71 smokeyrs exercise ///
+ active wt71
+preserve
+
+quietly logistic event qsmk qsmk#c.time ///
+ qsmk#c.time#c.time time c.time#c.time ///
+ sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71 , cluster(seqn)
+
+drop if time != 0
+expand 120 if time ==0
+bysort seqn: replace time = _n - 1
+expand 2 , generate(interv)
+replace qsmk = interv
+predict pevent_k, pr
+gen psurv_k = 1-pevent_k
+keep seqn time qsmk interv psurv_k
+sort seqn interv time
+gen _t = time + 1
+gen psurv = psurv_k if _t ==1
+bysort seqn interv: replace psurv = psurv_k*psurv[_t-1] if _t >1
+by interv, sort: summarize psurv if time == 119
+
+keep qsmk interv psurv time
+
+bysort interv : egen meanS = mean(psurv) if time == 119
+by interv: summarize meanS
+
+quietly summarize meanS if(qsmk==0 & time ==119)
+matrix input observe = ( 0,`r(mean)')
+quietly summarize meanS if(qsmk==1 & time ==119)
+matrix observe = (observe \1,`r(mean)')
+matrix observe = (observe \2, observe[2,2]-observe[1,2])
+*Add some row/column descriptions and print results to screen*
+matrix rownames observe = P(Y(a=0)=1) P(Y(a=1)=1) difference
+matrix colnames observe = interv survival
+
+*Graph standardized survival over time, under interventions*
+/*Note: unlike in Program 17.3, we now have covariates
+so we first need to average survival across strata*/
+bysort interv time : egen meanS_t = mean(psurv)
+
+*Now we can continue with the graph*
+expand 2 if time ==0, generate(newtime)
+replace meanS_t = 1 if newtime == 1
+gen time2 = 0 if newtime ==1
+replace time2 = time + 1 if newtime == 0
+separate meanS_t, by(interv)
+
+twoway (line meanS_t0 time2, sort) ///
+ (line meanS_t1 time2, sort) ///
+ , ylabel(0.5(0.1)1.0) xlabel(0(12)120) ///
+ ytitle("Survival probability") xtitle("Months of follow-up") ///
+ legend(label(1 "A=0") label(2 "A=1"))
+gr export ./figs/stata-fig-17-4.png, replace
+
+*remove extra timepoint*
+drop if newtime == 1
+
+restore
+
+*Bootstraps*
+qui save ./data/nhefs_std2 , replace
+
+capture program drop bootstdz_surv
+
+program define bootstdz_surv , rclass
+use ./data/nhefs_std2 , clear
+preserve
+
+bsample, cluster(seqn) idcluster(newseqn)
+logistic event qsmk qsmk#c.time qsmk#c.time#c.time ///
+ time c.time#c.time ///
+ sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smkintensity82_71 ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71
+drop if time != 0
+/*only predict on new version of data */
+expand 120 if time ==0
+bysort newseqn: replace time = _n - 1
+expand 2 , generate(interv_b)
+replace qsmk = interv_b
+predict pevent_k, pr
+gen psurv_k = 1-pevent_k
+keep newseqn time qsmk psurv_k
+sort newseqn qsmk time
+gen _t = time + 1
+gen psurv = psurv_k if _t ==1
+bysort newseqn qsmk: replace psurv = psurv_k*psurv[_t-1] if _t >1
+drop if time != 119 /* keep only last observation */
+keep newseqn qsmk psurv
+/* if time is in data for complete graph add time to bysort */
+bysort qsmk : egen meanS_b = mean(psurv)
+keep newseqn qsmk meanS_b
+drop if newseqn != 1 /* only need one pair */
+drop newseqn
+
+return scalar boot_0 = meanS_b[1]
+return scalar boot_1 = meanS_b[2]
+return scalar boot_diff = return(boot_1) - return(boot_0)
+restore
+end
+
+set rmsg on
+simulate PrY_a0 = r(boot_0) PrY_a1 = r(boot_1) ///
+ difference=r(boot_diff), reps(10) seed(1): bootstdz_surv
+set rmsg off
+
+matrix pe = observe[1..3, 2]'
+bstat, stat(pe) n(1629)
(169,510 observations deleted)
(186,354 observations created)
@@ -1136,7 +1136,7 @@
Program 17.4Program 17.4Program 17.4
-
+
@@ -316,49 +316,49 @@
Program 17.1
library(here)
library("readxl")
-nhefs <- read_excel(here("data","NHEFS.xls"))
-
-# some preprocessing of the data
-nhefs$survtime <- ifelse(nhefs$death==0, 120,
- (nhefs$yrdth-83)*12+nhefs$modth) # yrdth ranges from 83 to 92
-
-table(nhefs$death, nhefs$qsmk)
-#>
-#> 0 1
-#> 0 985 326
-#> 1 216 102
-summary(nhefs[which(nhefs$death==1),]$survtime)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.00 35.00 61.00 61.14 86.75 120.00
-
-#install.packages("survival")
-#install.packages("ggplot2") # for plots
-#install.packages("survminer") # for plots
-library("survival")
-library("ggplot2")
-library("survminer")
-#> Loading required package: ggpubr
-#>
-#> Attaching package: 'survminer'
-#> The following object is masked from 'package:survival':
-#>
-#> myeloma
-survdiff(Surv(survtime, death) ~ qsmk, data=nhefs)
-#> Call:
-#> survdiff(formula = Surv(survtime, death) ~ qsmk, data = nhefs)
-#>
-#> N Observed Expected (O-E)^2/E (O-E)^2/V
-#> qsmk=0 1201 216 237.5 1.95 7.73
-#> qsmk=1 428 102 80.5 5.76 7.73
-#>
-#> Chisq= 7.7 on 1 degrees of freedom, p= 0.005
-
-fit <- survfit(Surv(survtime, death) ~ qsmk, data=nhefs)
-ggsurvplot(fit, data = nhefs, xlab="Months of follow-up",
- ylab="Survival probability",
- main="Product-Limit Survival Estimates", risk.table = TRUE)
library("readxl")
+nhefs <- read_excel(here("data","NHEFS.xls"))
+
+# some preprocessing of the data
+nhefs$survtime <- ifelse(nhefs$death==0, 120,
+ (nhefs$yrdth-83)*12+nhefs$modth) # yrdth ranges from 83 to 92
+
+table(nhefs$death, nhefs$qsmk)
+#>
+#> 0 1
+#> 0 985 326
+#> 1 216 102
summary(nhefs[which(nhefs$death==1),]$survtime)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.00 35.00 61.00 61.14 86.75 120.00
+#install.packages("survival")
+#install.packages("ggplot2") # for plots
+#install.packages("survminer") # for plots
+library("survival")
+library("ggplot2")
+library("survminer")
+#> Loading required package: ggpubr
+#>
+#> Attaching package: 'survminer'
+#> The following object is masked from 'package:survival':
+#>
+#> myeloma
survdiff(Surv(survtime, death) ~ qsmk, data=nhefs)
+#> Call:
+#> survdiff(formula = Surv(survtime, death) ~ qsmk, data = nhefs)
+#>
+#> N Observed Expected (O-E)^2/E (O-E)^2/V
+#> qsmk=0 1201 216 237.5 1.95 7.73
+#> qsmk=1 428 102 80.5 5.76 7.73
+#>
+#> Chisq= 7.7 on 1 degrees of freedom, p= 0.005
+fit <- survfit(Surv(survtime, death) ~ qsmk, data=nhefs)
+ggsurvplot(fit, data = nhefs, xlab="Months of follow-up",
+ ylab="Survival probability",
+ main="Product-Limit Survival Estimates", risk.table = TRUE)
Program 17.2
# creation of person-month data
-#install.packages("splitstackshape")
-library("splitstackshape")
-nhefs.surv <- expandRows(nhefs, "survtime", drop=F)
-nhefs.surv$time <- sequence(rle(nhefs.surv$seqn)$lengths)-1
-nhefs.surv$event <- ifelse(nhefs.surv$time==nhefs.surv$survtime-1 &
- nhefs.surv$death==1, 1, 0)
-nhefs.surv$timesq <- nhefs.surv$time^2
-
-# fit of parametric hazards model
-hazards.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq) +
- time + timesq, family=binomial(), data=nhefs.surv)
-summary(hazards.model)
-#>
-#> Call:
-#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
-#> time + timesq, family = binomial(), data = nhefs.surv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) 6.996e+00 2.309e-01 30.292 <2e-16 ***
-#> qsmk -3.355e-01 3.970e-01 -0.845 0.3981
-#> I(qsmk * time) -1.208e-02 1.503e-02 -0.804 0.4215
-#> I(qsmk * timesq) 1.612e-04 1.246e-04 1.293 0.1960
-#> time -1.960e-02 8.413e-03 -2.329 0.0198 *
-#> timesq 1.256e-04 6.686e-05 1.878 0.0604 .
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 4655.3 on 176763 degrees of freedom
-#> Residual deviance: 4631.3 on 176758 degrees of freedom
-#> AIC: 4643.3
-#>
-#> Number of Fisher Scoring iterations: 9
-
-# creation of dataset with all time points under each treatment level
-qsmk0 <- data.frame(cbind(seq(0, 119),0,(seq(0, 119))^2))
-qsmk1 <- data.frame(cbind(seq(0, 119),1,(seq(0, 119))^2))
-
-colnames(qsmk0) <- c("time", "qsmk", "timesq")
-colnames(qsmk1) <- c("time", "qsmk", "timesq")
-
-# assignment of estimated (1-hazard) to each person-month */
-qsmk0$p.noevent0 <- predict(hazards.model, qsmk0, type="response")
-qsmk1$p.noevent1 <- predict(hazards.model, qsmk1, type="response")
-
-# computation of survival for each person-month
-qsmk0$surv0 <- cumprod(qsmk0$p.noevent0)
-qsmk1$surv1 <- cumprod(qsmk1$p.noevent1)
-
-# some data management to plot estimated survival curves
-hazards.graph <- merge(qsmk0, qsmk1, by=c("time", "timesq"))
-hazards.graph$survdiff <- hazards.graph$surv1-hazards.graph$surv0
-
-# plot
-ggplot(hazards.graph, aes(x=time, y=surv)) +
- geom_line(aes(y = surv0, colour = "0")) +
- geom_line(aes(y = surv1, colour = "1")) +
- xlab("Months") +
- scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
- scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
- ylab("Survival") +
- ggtitle("Survival from hazards model") +
- labs(colour="A:") +
- theme_bw() +
- theme(legend.position="bottom")
# creation of person-month data
+#install.packages("splitstackshape")
+library("splitstackshape")
+nhefs.surv <- expandRows(nhefs, "survtime", drop=F)
+nhefs.surv$time <- sequence(rle(nhefs.surv$seqn)$lengths)-1
+nhefs.surv$event <- ifelse(nhefs.surv$time==nhefs.surv$survtime-1 &
+ nhefs.surv$death==1, 1, 0)
+nhefs.surv$timesq <- nhefs.surv$time^2
+
+# fit of parametric hazards model
+hazards.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq) +
+ time + timesq, family=binomial(), data=nhefs.surv)
+summary(hazards.model)
+#>
+#> Call:
+#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
+#> time + timesq, family = binomial(), data = nhefs.surv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) 6.996e+00 2.309e-01 30.292 <2e-16 ***
+#> qsmk -3.355e-01 3.970e-01 -0.845 0.3981
+#> I(qsmk * time) -1.208e-02 1.503e-02 -0.804 0.4215
+#> I(qsmk * timesq) 1.612e-04 1.246e-04 1.293 0.1960
+#> time -1.960e-02 8.413e-03 -2.329 0.0198 *
+#> timesq 1.256e-04 6.686e-05 1.878 0.0604 .
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 4655.3 on 176763 degrees of freedom
+#> Residual deviance: 4631.3 on 176758 degrees of freedom
+#> AIC: 4643.3
+#>
+#> Number of Fisher Scoring iterations: 9
+# creation of dataset with all time points under each treatment level
+qsmk0 <- data.frame(cbind(seq(0, 119),0,(seq(0, 119))^2))
+qsmk1 <- data.frame(cbind(seq(0, 119),1,(seq(0, 119))^2))
+
+colnames(qsmk0) <- c("time", "qsmk", "timesq")
+colnames(qsmk1) <- c("time", "qsmk", "timesq")
+
+# assignment of estimated (1-hazard) to each person-month */
+qsmk0$p.noevent0 <- predict(hazards.model, qsmk0, type="response")
+qsmk1$p.noevent1 <- predict(hazards.model, qsmk1, type="response")
+
+# computation of survival for each person-month
+qsmk0$surv0 <- cumprod(qsmk0$p.noevent0)
+qsmk1$surv1 <- cumprod(qsmk1$p.noevent1)
+
+# some data management to plot estimated survival curves
+hazards.graph <- merge(qsmk0, qsmk1, by=c("time", "timesq"))
+hazards.graph$survdiff <- hazards.graph$surv1-hazards.graph$surv0
+
+# plot
+ggplot(hazards.graph, aes(x=time, y=surv)) +
+ geom_line(aes(y = surv0, colour = "0")) +
+ geom_line(aes(y = surv1, colour = "1")) +
+ xlab("Months") +
+ scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
+ scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
+ ylab("Survival") +
+ ggtitle("Survival from hazards model") +
+ labs(colour="A:") +
+ theme_bw() +
+ theme(legend.position="bottom")
Program 17.3
# estimation of denominator of ip weights
-p.denom <- glm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity)
- + smokeyrs + I(smokeyrs*smokeyrs) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71*wt71),
- data=nhefs, family=binomial())
-nhefs$pd.qsmk <- predict(p.denom, nhefs, type="response")
-
-# estimation of numerator of ip weights
-p.num <- glm(qsmk ~ 1, data=nhefs, family=binomial())
-nhefs$pn.qsmk <- predict(p.num, nhefs, type="response")
-
-# computation of estimated weights
-nhefs$sw.a <- ifelse(nhefs$qsmk==1, nhefs$pn.qsmk/nhefs$pd.qsmk,
- (1-nhefs$pn.qsmk)/(1-nhefs$pd.qsmk))
-summary(nhefs$sw.a)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.3312 0.8640 0.9504 0.9991 1.0755 4.2054
-
-# creation of person-month data
-nhefs.ipw <- expandRows(nhefs, "survtime", drop=F)
-nhefs.ipw$time <- sequence(rle(nhefs.ipw$seqn)$lengths)-1
-nhefs.ipw$event <- ifelse(nhefs.ipw$time==nhefs.ipw$survtime-1 &
- nhefs.ipw$death==1, 1, 0)
-nhefs.ipw$timesq <- nhefs.ipw$time^2
-
-# fit of weighted hazards model
-ipw.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq) +
- time + timesq, family=binomial(), weight=sw.a,
- data=nhefs.ipw)
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-summary(ipw.model)
-#>
-#> Call:
-#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
-#> time + timesq, family = binomial(), data = nhefs.ipw, weights = sw.a)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) 6.897e+00 2.208e-01 31.242 <2e-16 ***
-#> qsmk 1.794e-01 4.399e-01 0.408 0.6834
-#> I(qsmk * time) -1.895e-02 1.640e-02 -1.155 0.2481
-#> I(qsmk * timesq) 2.103e-04 1.352e-04 1.556 0.1198
-#> time -1.889e-02 8.053e-03 -2.345 0.0190 *
-#> timesq 1.181e-04 6.399e-05 1.846 0.0649 .
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 4643.9 on 176763 degrees of freedom
-#> Residual deviance: 4626.2 on 176758 degrees of freedom
-#> AIC: 4633.5
-#>
-#> Number of Fisher Scoring iterations: 9
-
-# creation of survival curves
-ipw.qsmk0 <- data.frame(cbind(seq(0, 119),0,(seq(0, 119))^2))
-ipw.qsmk1 <- data.frame(cbind(seq(0, 119),1,(seq(0, 119))^2))
-
-colnames(ipw.qsmk0) <- c("time", "qsmk", "timesq")
-colnames(ipw.qsmk1) <- c("time", "qsmk", "timesq")
-
-# assignment of estimated (1-hazard) to each person-month */
-ipw.qsmk0$p.noevent0 <- predict(ipw.model, ipw.qsmk0, type="response")
-ipw.qsmk1$p.noevent1 <- predict(ipw.model, ipw.qsmk1, type="response")
-
-# computation of survival for each person-month
-ipw.qsmk0$surv0 <- cumprod(ipw.qsmk0$p.noevent0)
-ipw.qsmk1$surv1 <- cumprod(ipw.qsmk1$p.noevent1)
-
-# some data management to plot estimated survival curves
-ipw.graph <- merge(ipw.qsmk0, ipw.qsmk1, by=c("time", "timesq"))
-ipw.graph$survdiff <- ipw.graph$surv1-ipw.graph$surv0
-
-# plot
-ggplot(ipw.graph, aes(x=time, y=surv)) +
- geom_line(aes(y = surv0, colour = "0")) +
- geom_line(aes(y = surv1, colour = "1")) +
- xlab("Months") +
- scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
- scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
- ylab("Survival") +
- ggtitle("Survival from IP weighted hazards model") +
- labs(colour="A:") +
- theme_bw() +
- theme(legend.position="bottom")
# estimation of denominator of ip weights
+p.denom <- glm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity)
+ + smokeyrs + I(smokeyrs*smokeyrs) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71*wt71),
+ data=nhefs, family=binomial())
+nhefs$pd.qsmk <- predict(p.denom, nhefs, type="response")
+
+# estimation of numerator of ip weights
+p.num <- glm(qsmk ~ 1, data=nhefs, family=binomial())
+nhefs$pn.qsmk <- predict(p.num, nhefs, type="response")
+
+# computation of estimated weights
+nhefs$sw.a <- ifelse(nhefs$qsmk==1, nhefs$pn.qsmk/nhefs$pd.qsmk,
+ (1-nhefs$pn.qsmk)/(1-nhefs$pd.qsmk))
+summary(nhefs$sw.a)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.3312 0.8640 0.9504 0.9991 1.0755 4.2054
+# creation of person-month data
+nhefs.ipw <- expandRows(nhefs, "survtime", drop=F)
+nhefs.ipw$time <- sequence(rle(nhefs.ipw$seqn)$lengths)-1
+nhefs.ipw$event <- ifelse(nhefs.ipw$time==nhefs.ipw$survtime-1 &
+ nhefs.ipw$death==1, 1, 0)
+nhefs.ipw$timesq <- nhefs.ipw$time^2
+
+# fit of weighted hazards model
+ipw.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq) +
+ time + timesq, family=binomial(), weight=sw.a,
+ data=nhefs.ipw)
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
summary(ipw.model)
+#>
+#> Call:
+#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
+#> time + timesq, family = binomial(), data = nhefs.ipw, weights = sw.a)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) 6.897e+00 2.208e-01 31.242 <2e-16 ***
+#> qsmk 1.794e-01 4.399e-01 0.408 0.6834
+#> I(qsmk * time) -1.895e-02 1.640e-02 -1.155 0.2481
+#> I(qsmk * timesq) 2.103e-04 1.352e-04 1.556 0.1198
+#> time -1.889e-02 8.053e-03 -2.345 0.0190 *
+#> timesq 1.181e-04 6.399e-05 1.846 0.0649 .
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 4643.9 on 176763 degrees of freedom
+#> Residual deviance: 4626.2 on 176758 degrees of freedom
+#> AIC: 4633.5
+#>
+#> Number of Fisher Scoring iterations: 9
+# creation of survival curves
+ipw.qsmk0 <- data.frame(cbind(seq(0, 119),0,(seq(0, 119))^2))
+ipw.qsmk1 <- data.frame(cbind(seq(0, 119),1,(seq(0, 119))^2))
+
+colnames(ipw.qsmk0) <- c("time", "qsmk", "timesq")
+colnames(ipw.qsmk1) <- c("time", "qsmk", "timesq")
+
+# assignment of estimated (1-hazard) to each person-month */
+ipw.qsmk0$p.noevent0 <- predict(ipw.model, ipw.qsmk0, type="response")
+ipw.qsmk1$p.noevent1 <- predict(ipw.model, ipw.qsmk1, type="response")
+
+# computation of survival for each person-month
+ipw.qsmk0$surv0 <- cumprod(ipw.qsmk0$p.noevent0)
+ipw.qsmk1$surv1 <- cumprod(ipw.qsmk1$p.noevent1)
+
+# some data management to plot estimated survival curves
+ipw.graph <- merge(ipw.qsmk0, ipw.qsmk1, by=c("time", "timesq"))
+ipw.graph$survdiff <- ipw.graph$surv1-ipw.graph$surv0
+
+# plot
+ggplot(ipw.graph, aes(x=time, y=surv)) +
+ geom_line(aes(y = surv0, colour = "0")) +
+ geom_line(aes(y = surv1, colour = "1")) +
+ xlab("Months") +
+ scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
+ scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
+ ylab("Survival") +
+ ggtitle("Survival from IP weighted hazards model") +
+ labs(colour="A:") +
+ theme_bw() +
+ theme(legend.position="bottom")
Program 17.4
# fit of hazards model with covariates
-gf.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq)
- + time + timesq + sex + race + age + I(age*age)
- + as.factor(education) + smokeintensity
- + I(smokeintensity*smokeintensity) + smkintensity82_71
- + smokeyrs + I(smokeyrs*smokeyrs) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71*wt71),
- data=nhefs.surv, family=binomial())
-summary(gf.model)
-#>
-#> Call:
-#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
-#> time + timesq + sex + race + age + I(age * age) + as.factor(education) +
-#> smokeintensity + I(smokeintensity * smokeintensity) + smkintensity82_71 +
-#> smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71), family = binomial(),
-#> data = nhefs.surv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) 9.272e+00 1.379e+00 6.724 1.76e-11 ***
-#> qsmk 5.959e-02 4.154e-01 0.143 0.885924
-#> I(qsmk * time) -1.485e-02 1.506e-02 -0.987 0.323824
-#> I(qsmk * timesq) 1.702e-04 1.245e-04 1.367 0.171643
-#> time -2.270e-02 8.437e-03 -2.690 0.007142 **
-#> timesq 1.174e-04 6.709e-05 1.751 0.080020 .
-#> sex 4.368e-01 1.409e-01 3.101 0.001930 **
-#> race -5.240e-02 1.734e-01 -0.302 0.762572
-#> age -8.750e-02 5.907e-02 -1.481 0.138536
-#> I(age * age) 8.128e-05 5.470e-04 0.149 0.881865
-#> as.factor(education)2 1.401e-01 1.566e-01 0.895 0.370980
-#> as.factor(education)3 4.335e-01 1.526e-01 2.841 0.004502 **
-#> as.factor(education)4 2.350e-01 2.790e-01 0.842 0.399750
-#> as.factor(education)5 3.750e-01 2.386e-01 1.571 0.116115
-#> smokeintensity -1.626e-03 1.430e-02 -0.114 0.909431
-#> I(smokeintensity * smokeintensity) -7.182e-05 2.390e-04 -0.301 0.763741
-#> smkintensity82_71 -1.686e-03 6.501e-03 -0.259 0.795399
-#> smokeyrs -1.677e-02 3.065e-02 -0.547 0.584153
-#> I(smokeyrs * smokeyrs) -5.280e-05 4.244e-04 -0.124 0.900997
-#> as.factor(exercise)1 1.469e-01 1.792e-01 0.820 0.412300
-#> as.factor(exercise)2 -1.504e-01 1.762e-01 -0.854 0.393177
-#> as.factor(active)1 -1.601e-01 1.300e-01 -1.232 0.218048
-#> as.factor(active)2 -2.294e-01 1.877e-01 -1.222 0.221766
-#> wt71 6.222e-02 1.902e-02 3.271 0.001073 **
-#> I(wt71 * wt71) -4.046e-04 1.129e-04 -3.584 0.000338 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 4655.3 on 176763 degrees of freedom
-#> Residual deviance: 4185.7 on 176739 degrees of freedom
-#> AIC: 4235.7
-#>
-#> Number of Fisher Scoring iterations: 10
-
-# creation of dataset with all time points for
-# each individual under each treatment level
-gf.qsmk0 <- expandRows(nhefs, count=120, count.is.col=F)
-gf.qsmk0$time <- rep(seq(0, 119), nrow(nhefs))
-gf.qsmk0$timesq <- gf.qsmk0$time^2
-gf.qsmk0$qsmk <- 0
-
-gf.qsmk1 <- gf.qsmk0
-gf.qsmk1$qsmk <- 1
-
-gf.qsmk0$p.noevent0 <- predict(gf.model, gf.qsmk0, type="response")
-gf.qsmk1$p.noevent1 <- predict(gf.model, gf.qsmk1, type="response")
-
-#install.packages("dplyr")
-library("dplyr")
-#>
-#> Attaching package: 'dplyr'
-#> The following objects are masked from 'package:stats':
-#>
-#> filter, lag
-#> The following objects are masked from 'package:base':
-#>
-#> intersect, setdiff, setequal, union
-gf.qsmk0.surv <- gf.qsmk0 %>% group_by(seqn) %>% mutate(surv0 = cumprod(p.noevent0))
-gf.qsmk1.surv <- gf.qsmk1 %>% group_by(seqn) %>% mutate(surv1 = cumprod(p.noevent1))
-
-gf.surv0 <-
- aggregate(gf.qsmk0.surv,
- by = list(gf.qsmk0.surv$time),
- FUN = mean)[c("qsmk", "time", "surv0")]
-gf.surv1 <-
- aggregate(gf.qsmk1.surv,
- by = list(gf.qsmk1.surv$time),
- FUN = mean)[c("qsmk", "time", "surv1")]
-
-gf.graph <- merge(gf.surv0, gf.surv1, by=c("time"))
-gf.graph$survdiff <- gf.graph$surv1-gf.graph$surv0
-
-# plot
-ggplot(gf.graph, aes(x=time, y=surv)) +
- geom_line(aes(y = surv0, colour = "0")) +
- geom_line(aes(y = surv1, colour = "1")) +
- xlab("Months") +
- scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
- scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
- ylab("Survival") +
- ggtitle("Survival from g-formula") +
- labs(colour="A:") +
- theme_bw() +
- theme(legend.position="bottom")
# fit of hazards model with covariates
+gf.model <- glm(event==0 ~ qsmk + I(qsmk*time) + I(qsmk*timesq)
+ + time + timesq + sex + race + age + I(age*age)
+ + as.factor(education) + smokeintensity
+ + I(smokeintensity*smokeintensity) + smkintensity82_71
+ + smokeyrs + I(smokeyrs*smokeyrs) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71*wt71),
+ data=nhefs.surv, family=binomial())
+summary(gf.model)
+#>
+#> Call:
+#> glm(formula = event == 0 ~ qsmk + I(qsmk * time) + I(qsmk * timesq) +
+#> time + timesq + sex + race + age + I(age * age) + as.factor(education) +
+#> smokeintensity + I(smokeintensity * smokeintensity) + smkintensity82_71 +
+#> smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71), family = binomial(),
+#> data = nhefs.surv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) 9.272e+00 1.379e+00 6.724 1.76e-11 ***
+#> qsmk 5.959e-02 4.154e-01 0.143 0.885924
+#> I(qsmk * time) -1.485e-02 1.506e-02 -0.987 0.323824
+#> I(qsmk * timesq) 1.702e-04 1.245e-04 1.367 0.171643
+#> time -2.270e-02 8.437e-03 -2.690 0.007142 **
+#> timesq 1.174e-04 6.709e-05 1.751 0.080020 .
+#> sex 4.368e-01 1.409e-01 3.101 0.001930 **
+#> race -5.240e-02 1.734e-01 -0.302 0.762572
+#> age -8.750e-02 5.907e-02 -1.481 0.138536
+#> I(age * age) 8.128e-05 5.470e-04 0.149 0.881865
+#> as.factor(education)2 1.401e-01 1.566e-01 0.895 0.370980
+#> as.factor(education)3 4.335e-01 1.526e-01 2.841 0.004502 **
+#> as.factor(education)4 2.350e-01 2.790e-01 0.842 0.399750
+#> as.factor(education)5 3.750e-01 2.386e-01 1.571 0.116115
+#> smokeintensity -1.626e-03 1.430e-02 -0.114 0.909431
+#> I(smokeintensity * smokeintensity) -7.182e-05 2.390e-04 -0.301 0.763741
+#> smkintensity82_71 -1.686e-03 6.501e-03 -0.259 0.795399
+#> smokeyrs -1.677e-02 3.065e-02 -0.547 0.584153
+#> I(smokeyrs * smokeyrs) -5.280e-05 4.244e-04 -0.124 0.900997
+#> as.factor(exercise)1 1.469e-01 1.792e-01 0.820 0.412300
+#> as.factor(exercise)2 -1.504e-01 1.762e-01 -0.854 0.393177
+#> as.factor(active)1 -1.601e-01 1.300e-01 -1.232 0.218048
+#> as.factor(active)2 -2.294e-01 1.877e-01 -1.222 0.221766
+#> wt71 6.222e-02 1.902e-02 3.271 0.001073 **
+#> I(wt71 * wt71) -4.046e-04 1.129e-04 -3.584 0.000338 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 4655.3 on 176763 degrees of freedom
+#> Residual deviance: 4185.7 on 176739 degrees of freedom
+#> AIC: 4235.7
+#>
+#> Number of Fisher Scoring iterations: 10
+# creation of dataset with all time points for
+# each individual under each treatment level
+gf.qsmk0 <- expandRows(nhefs, count=120, count.is.col=F)
+gf.qsmk0$time <- rep(seq(0, 119), nrow(nhefs))
+gf.qsmk0$timesq <- gf.qsmk0$time^2
+gf.qsmk0$qsmk <- 0
+
+gf.qsmk1 <- gf.qsmk0
+gf.qsmk1$qsmk <- 1
+
+gf.qsmk0$p.noevent0 <- predict(gf.model, gf.qsmk0, type="response")
+gf.qsmk1$p.noevent1 <- predict(gf.model, gf.qsmk1, type="response")
+
+#install.packages("dplyr")
+library("dplyr")
+#>
+#> Attaching package: 'dplyr'
+#> The following objects are masked from 'package:stats':
+#>
+#> filter, lag
+#> The following objects are masked from 'package:base':
+#>
+#> intersect, setdiff, setequal, union
gf.qsmk0.surv <- gf.qsmk0 %>% group_by(seqn) %>% mutate(surv0 = cumprod(p.noevent0))
+gf.qsmk1.surv <- gf.qsmk1 %>% group_by(seqn) %>% mutate(surv1 = cumprod(p.noevent1))
+
+gf.surv0 <-
+ aggregate(gf.qsmk0.surv,
+ by = list(gf.qsmk0.surv$time),
+ FUN = mean)[c("qsmk", "time", "surv0")]
+gf.surv1 <-
+ aggregate(gf.qsmk1.surv,
+ by = list(gf.qsmk1.surv$time),
+ FUN = mean)[c("qsmk", "time", "surv1")]
+
+gf.graph <- merge(gf.surv0, gf.surv1, by=c("time"))
+gf.graph$survdiff <- gf.graph$surv1-gf.graph$surv0
+
+# plot
+ggplot(gf.graph, aes(x=time, y=surv)) +
+ geom_line(aes(y = surv0, colour = "0")) +
+ geom_line(aes(y = surv1, colour = "1")) +
+ xlab("Months") +
+ scale_x_continuous(limits = c(0, 120), breaks=seq(0,120,12)) +
+ scale_y_continuous(limits=c(0.6, 1), breaks=seq(0.6, 1, 0.2)) +
+ ylab("Survival") +
+ ggtitle("Survival from g-formula") +
+ labs(colour="A:") +
+ theme_bw() +
+ theme(legend.position="bottom")
Program 17.5
# some preprocessing of the data
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-nhefs$survtime <-
- ifelse(nhefs$death == 0, NA, (nhefs$yrdth - 83) * 12 + nhefs$modth)
- # * yrdth ranges from 83 to 92
-
-# model to estimate E[A|L]
-modelA <- glm(qsmk ~ sex + race + age + I(age*age)
- + as.factor(education) + smokeintensity
- + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71*wt71),
- data=nhefs, family=binomial())
-
-nhefs$p.qsmk <- predict(modelA, nhefs, type="response")
-d <- nhefs[!is.na(nhefs$survtime),] # select only those with observed death time
-n <- nrow(d)
-
-# define the estimating function that needs to be minimized
-sumeef <- function(psi){
-
- # creation of delta indicator
- if (psi>=0){
- delta <- ifelse(d$qsmk==0 |
- (d$qsmk==1 & psi <= log(120/d$survtime)),
- 1, 0)
- } else if (psi < 0) {
- delta <- ifelse(d$qsmk==1 |
- (d$qsmk==0 & psi > log(d$survtime/120)), 1, 0)
- }
-
- smat <- delta*(d$qsmk-d$p.qsmk)
- sval <- sum(smat, na.rm=T)
- save <- sval/n
- smat <- smat - rep(save, n)
-
- # covariance
- sigma <- t(smat) %*% smat
- if (sigma == 0){
- sigma <- 1e-16
- }
- estimeq <- sval*solve(sigma)*t(sval)
- return(estimeq)
-}
-
-res <- optimize(sumeef, interval = c(-0.2,0.2))
-psi1 <- res$minimum
-objfunc <- as.numeric(res$objective)
-
-
-# Use simple bisection method to find estimates of lower and upper 95% confidence bounds
-increm <- 0.1
-for_conf <- function(x){
- return(sumeef(x) - 3.84)
-}
-
-if (objfunc < 3.84){
- # Find estimate of where sumeef(x) > 3.84
-
- # Lower bound of 95% CI
- psilow <- psi1
- testlow <- objfunc
- countlow <- 0
- while (testlow < 3.84 & countlow < 100){
- psilow <- psilow - increm
- testlow <- sumeef(psilow)
- countlow <- countlow + 1
- }
-
- # Upper bound of 95% CI
- psihigh <- psi1
- testhigh <- objfunc
- counthigh <- 0
- while (testhigh < 3.84 & counthigh < 100){
- psihigh <- psihigh + increm
- testhigh <- sumeef(psihigh)
- counthigh <- counthigh + 1
- }
-
- # Better estimate using bisection method
- if ((testhigh > 3.84) & (testlow > 3.84)){
-
- # Bisection method
- left <- psi1
- fleft <- objfunc - 3.84
- right <- psihigh
- fright <- testhigh - 3.84
- middle <- (left + right) / 2
- fmiddle <- for_conf(middle)
- count <- 0
- diff <- right - left
-
- while (!(abs(fmiddle) < 0.0001 | diff < 0.0001 | count > 100)){
- test <- fmiddle * fleft
- if (test < 0){
- right <- middle
- fright <- fmiddle
- } else {
- left <- middle
- fleft <- fmiddle
- }
- middle <- (left + right) / 2
- fmiddle <- for_conf(middle)
- count <- count + 1
- diff <- right - left
- }
-
- psi_high <- middle
- objfunc_high <- fmiddle + 3.84
-
- # lower bound of 95% CI
- left <- psilow
- fleft <- testlow - 3.84
- right <- psi1
- fright <- objfunc - 3.84
- middle <- (left + right) / 2
- fmiddle <- for_conf(middle)
- count <- 0
- diff <- right - left
-
- while(!(abs(fmiddle) < 0.0001 | diff < 0.0001 | count > 100)){
- test <- fmiddle * fleft
- if (test < 0){
- right <- middle
- fright <- fmiddle
- } else {
- left <- middle
- fleft <- fmiddle
- }
- middle <- (left + right) / 2
- fmiddle <- for_conf(middle)
- diff <- right - left
- count <- count + 1
- }
- psi_low <- middle
- objfunc_low <- fmiddle + 3.84
- psi <- psi1
- }
-}
-c(psi, psi_low, psi_high)
-#> [1] -0.05041591 -0.22312099 0.33312901
# some preprocessing of the data
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+nhefs$survtime <-
+ ifelse(nhefs$death == 0, NA, (nhefs$yrdth - 83) * 12 + nhefs$modth)
+ # * yrdth ranges from 83 to 92
+
+# model to estimate E[A|L]
+modelA <- glm(qsmk ~ sex + race + age + I(age*age)
+ + as.factor(education) + smokeintensity
+ + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71*wt71),
+ data=nhefs, family=binomial())
+
+nhefs$p.qsmk <- predict(modelA, nhefs, type="response")
+d <- nhefs[!is.na(nhefs$survtime),] # select only those with observed death time
+n <- nrow(d)
+
+# define the estimating function that needs to be minimized
+sumeef <- function(psi){
+
+ # creation of delta indicator
+ if (psi>=0){
+ delta <- ifelse(d$qsmk==0 |
+ (d$qsmk==1 & psi <= log(120/d$survtime)),
+ 1, 0)
+ } else if (psi < 0) {
+ delta <- ifelse(d$qsmk==1 |
+ (d$qsmk==0 & psi > log(d$survtime/120)), 1, 0)
+ }
+
+ smat <- delta*(d$qsmk-d$p.qsmk)
+ sval <- sum(smat, na.rm=T)
+ save <- sval/n
+ smat <- smat - rep(save, n)
+
+ # covariance
+ sigma <- t(smat) %*% smat
+ if (sigma == 0){
+ sigma <- 1e-16
+ }
+ estimeq <- sval*solve(sigma)*t(sval)
+ return(estimeq)
+}
+
+res <- optimize(sumeef, interval = c(-0.2,0.2))
+psi1 <- res$minimum
+objfunc <- as.numeric(res$objective)
+
+
+# Use simple bisection method to find estimates of lower and upper 95% confidence bounds
+increm <- 0.1
+for_conf <- function(x){
+ return(sumeef(x) - 3.84)
+}
+
+if (objfunc < 3.84){
+ # Find estimate of where sumeef(x) > 3.84
+
+ # Lower bound of 95% CI
+ psilow <- psi1
+ testlow <- objfunc
+ countlow <- 0
+ while (testlow < 3.84 & countlow < 100){
+ psilow <- psilow - increm
+ testlow <- sumeef(psilow)
+ countlow <- countlow + 1
+ }
+
+ # Upper bound of 95% CI
+ psihigh <- psi1
+ testhigh <- objfunc
+ counthigh <- 0
+ while (testhigh < 3.84 & counthigh < 100){
+ psihigh <- psihigh + increm
+ testhigh <- sumeef(psihigh)
+ counthigh <- counthigh + 1
+ }
+
+ # Better estimate using bisection method
+ if ((testhigh > 3.84) & (testlow > 3.84)){
+
+ # Bisection method
+ left <- psi1
+ fleft <- objfunc - 3.84
+ right <- psihigh
+ fright <- testhigh - 3.84
+ middle <- (left + right) / 2
+ fmiddle <- for_conf(middle)
+ count <- 0
+ diff <- right - left
+
+ while (!(abs(fmiddle) < 0.0001 | diff < 0.0001 | count > 100)){
+ test <- fmiddle * fleft
+ if (test < 0){
+ right <- middle
+ fright <- fmiddle
+ } else {
+ left <- middle
+ fleft <- fmiddle
+ }
+ middle <- (left + right) / 2
+ fmiddle <- for_conf(middle)
+ count <- count + 1
+ diff <- right - left
+ }
+
+ psi_high <- middle
+ objfunc_high <- fmiddle + 3.84
+
+ # lower bound of 95% CI
+ left <- psilow
+ fleft <- testlow - 3.84
+ right <- psi1
+ fright <- objfunc - 3.84
+ middle <- (left + right) / 2
+ fmiddle <- for_conf(middle)
+ count <- 0
+ diff <- right - left
+
+ while(!(abs(fmiddle) < 0.0001 | diff < 0.0001 | count > 100)){
+ test <- fmiddle * fleft
+ if (test < 0){
+ right <- middle
+ fright <- fmiddle
+ } else {
+ left <- middle
+ fleft <- fmiddle
+ }
+ middle <- (left + right) / 2
+ fmiddle <- for_conf(middle)
+ diff <- right - left
+ count <- count + 1
+ }
+ psi_low <- middle
+ objfunc_low <- fmiddle + 3.84
+ psi <- psi1
+ }
+}
+c(psi, psi_low, psi_high)
+#> [1] -0.05041591 -0.22312099 0.33312901
14. G-estimation of Structural Nested Models: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -324,33 +324,33 @@
Program 14.1
/*For Stata 15 or later, first install the extremes function using this code:*/
-* ssc install extremes
-
-*Data preprocessing***
-
-use ./data/nhefs, clear
-gen byte cens = (wt82 == .)
-
-/*Ranking of extreme observations*/
-extremes wt82_71 seqn
-
-/*Estimate unstabilized censoring weights for use in g-estimation models*/
-glm cens qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71 ///
- , family(binomial)
-predict pr_cens
-gen w_cens = 1/(1-pr_cens)
-replace w_cens = . if cens == 1
-/*observations with cens = 1 contribute to censoring models but not outcome model*/
-summarize w_cens
-
-/*Analyses restricted to N=1566*/
-drop if wt82 == .
-summarize wt82_71
-
-save ./data/nhefs-wcens, replace
/*For Stata 15 or later, first install the extremes function using this code:*/
+* ssc install extremes
+
+*Data preprocessing***
+
+use ./data/nhefs, clear
+gen byte cens = (wt82 == .)
+
+/*Ranking of extreme observations*/
+extremes wt82_71 seqn
+
+/*Estimate unstabilized censoring weights for use in g-estimation models*/
+glm cens qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71 ///
+ , family(binomial)
+predict pr_cens
+gen w_cens = 1/(1-pr_cens)
+replace w_cens = . if cens == 1
+/*observations with cens = 1 contribute to censoring models but not outcome model*/
+summarize w_cens
+
+/*Analyses restricted to N=1566*/
+drop if wt82 == .
+summarize wt82_71
+
+save ./data/nhefs-wcens, replace
| obs: wt82_71 seqn |
|------------------------------|
| 1329. -41.28046982 23321 |
@@ -454,68 +454,68 @@
Program 14.2
+use ./data/nhefs-wcens, clear
-
-/*Generate test value of Psi = 3.446*/
-gen psi = 3.446
-
-/*Generate H(Psi) for each individual using test value of Psi and
-their own values of weight change and smoking status*/
-gen Hpsi = wt82_71 - psi * qsmk
-
-/*Fit a model for smoking status, given confounders and H(Psi) value,
-with censoring weights and display H(Psi) coefficient*/
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71 Hpsi ///
- [pw = w_cens], cluster(seqn)
-di _b[Hpsi]
-
-/*G-estimation*/
-/*Checking multiple possible values of psi*/
-cap noi drop psi Hpsi
-
-local seq_start = 2
-local seq_end = 5
-local seq_by = 0.1 // Setting seq_by = 0.01 will yield the result 3.46
-local seq_len = (`seq_end'-`seq_start')/`seq_by' + 1
-
-matrix results = J(`seq_len', 4, 0)
-
-qui gen psi = .
-qui gen Hpsi = .
-
-local j = 0
-
-forvalues i = `seq_start'(`seq_by')`seq_end' {
- local j = `j' + 1
- qui replace psi = `i'
- qui replace Hpsi = wt82_71 - psi * qsmk
- quietly logit qsmk sex race c.age##c.age ///
- ib(last).education c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71 Hpsi ///
- [pw = w_cens], cluster(seqn)
- matrix p_mat = r(table)
- matrix p_mat = p_mat["pvalue","qsmk:Hpsi"]
- local p = p_mat[1,1]
- local b = _b[Hpsi]
- di "coeff", %6.3f `b', "is generated from psi", %4.1f `i'
- matrix results[`j',1]= `i'
- matrix results[`j',2]= `b'
- matrix results[`j',3]= abs(`b')
- matrix results[`j',4]= `p'
-}
-matrix colnames results = "psi" "B(Hpsi)" "AbsB(Hpsi)" "pvalue"
-mat li results
-
-mata
-res = st_matrix("results")
-for(i=1; i<= rows(res); i++) {
- if (res[i,3] == colmin(res[,3])) res[i,1]
-}
-end
-* Setting seq_by = 0.01 will yield the result 3.46
use ./data/nhefs-wcens, clear
+
+/*Generate test value of Psi = 3.446*/
+gen psi = 3.446
+
+/*Generate H(Psi) for each individual using test value of Psi and
+their own values of weight change and smoking status*/
+gen Hpsi = wt82_71 - psi * qsmk
+
+/*Fit a model for smoking status, given confounders and H(Psi) value,
+with censoring weights and display H(Psi) coefficient*/
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71 Hpsi ///
+ [pw = w_cens], cluster(seqn)
+di _b[Hpsi]
+
+/*G-estimation*/
+/*Checking multiple possible values of psi*/
+cap noi drop psi Hpsi
+
+local seq_start = 2
+local seq_end = 5
+local seq_by = 0.1 // Setting seq_by = 0.01 will yield the result 3.46
+local seq_len = (`seq_end'-`seq_start')/`seq_by' + 1
+
+matrix results = J(`seq_len', 4, 0)
+
+qui gen psi = .
+qui gen Hpsi = .
+
+local j = 0
+
+forvalues i = `seq_start'(`seq_by')`seq_end' {
+ local j = `j' + 1
+ qui replace psi = `i'
+ qui replace Hpsi = wt82_71 - psi * qsmk
+ quietly logit qsmk sex race c.age##c.age ///
+ ib(last).education c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71 Hpsi ///
+ [pw = w_cens], cluster(seqn)
+ matrix p_mat = r(table)
+ matrix p_mat = p_mat["pvalue","qsmk:Hpsi"]
+ local p = p_mat[1,1]
+ local b = _b[Hpsi]
+ di "coeff", %6.3f `b', "is generated from psi", %4.1f `i'
+ matrix results[`j',1]= `i'
+ matrix results[`j',2]= `b'
+ matrix results[`j',3]= abs(`b')
+ matrix results[`j',4]= `p'
+}
+matrix colnames results = "psi" "B(Hpsi)" "AbsB(Hpsi)" "pvalue"
+mat li results
+
+mata
+res = st_matrix("results")
+for(i=1; i<= rows(res); i++) {
+ if (res[i,3] == colmin(res[,3])) res[i,1]
+}
+end
+* Setting seq_by = 0.01 will yield the result 3.46
Iteration 0: Log pseudolikelihood = -936.10067
Iteration 1: Log pseudolikelihood = -879.13942
Iteration 2: Log pseudolikelihood = -877.82647
@@ -678,44 +678,44 @@
Program 14.3
+use ./data/nhefs-wcens, clear
-
-/*create weights*/
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71 ///
- [pw = w_cens], cluster(seqn)
-predict pr_qsmk
-summarize pr_qsmk
-
-/* Closed form estimator linear mean models **/
-* ssc install tomata
-putmata *, replace
-mata: diff = qsmk - pr_qsmk
-mata: part1 = w_cens :* wt82_71 :* diff
-mata: part2 = w_cens :* qsmk :* diff
-mata: psi = sum(part1)/sum(part2)
-
-/*** Closed form estimator for 2-parameter model **/
-mata
-diff = qsmk - pr_qsmk
-diff2 = w_cens :* diff
-
-lhs = J(2,2, 0)
-lhs[1,1] = sum( qsmk :* diff2)
-lhs[1,2] = sum( qsmk :* smokeintensity :* diff2 )
-lhs[2,1] = sum( qsmk :* smokeintensity :* diff2)
-lhs[2,2] = sum( qsmk :* smokeintensity :* smokeintensity :* diff2 )
-
-rhs = J(2,1,0)
-rhs[1] = sum(wt82_71 :* diff2 )
-rhs[2] = sum(wt82_71 :* smokeintensity :* diff2 )
-
-psi = (lusolve(lhs, rhs))'
-psi
-psi = (invsym(lhs'lhs)*lhs'rhs)'
-psi
-end
use ./data/nhefs-wcens, clear
+
+/*create weights*/
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71 ///
+ [pw = w_cens], cluster(seqn)
+predict pr_qsmk
+summarize pr_qsmk
+
+/* Closed form estimator linear mean models **/
+* ssc install tomata
+putmata *, replace
+mata: diff = qsmk - pr_qsmk
+mata: part1 = w_cens :* wt82_71 :* diff
+mata: part2 = w_cens :* qsmk :* diff
+mata: psi = sum(part1)/sum(part2)
+
+/*** Closed form estimator for 2-parameter model **/
+mata
+diff = qsmk - pr_qsmk
+diff2 = w_cens :* diff
+
+lhs = J(2,2, 0)
+lhs[1,1] = sum( qsmk :* diff2)
+lhs[1,2] = sum( qsmk :* smokeintensity :* diff2 )
+lhs[2,1] = sum( qsmk :* smokeintensity :* diff2)
+lhs[2,2] = sum( qsmk :* smokeintensity :* smokeintensity :* diff2 )
+
+rhs = J(2,1,0)
+rhs[1] = sum(wt82_71 :* diff2 )
+rhs[2] = sum(wt82_71 :* smokeintensity :* diff2 )
+
+psi = (lusolve(lhs, rhs))'
+psi
+psi = (invsym(lhs'lhs)*lhs'rhs)'
+psi
+end
Iteration 0: Log pseudolikelihood = -936.10067
Iteration 1: Log pseudolikelihood = -879.13943
Iteration 2: Log pseudolikelihood = -877.82647
diff --git a/docs/g-estimation-of-structural-nested-models.html b/docs/g-estimation-of-structural-nested-models.html
index 9d1fa35..304f125 100644
--- a/docs/g-estimation-of-structural-nested-models.html
+++ b/docs/g-estimation-of-structural-nested-models.html
@@ -26,7 +26,7 @@
-
+
@@ -316,81 +316,81 @@
Program 14.1
-library(here)
# install.packages("readxl") # install package if required
-library("readxl")
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-
-# some processing of the data
-nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
-
-# ranking of extreme observations
-#install.packages("Hmisc")
-library(Hmisc)
-#>
-#> Attaching package: 'Hmisc'
-#> The following objects are masked from 'package:base':
-#>
-#> format.pval, units
-describe(nhefs$wt82_71)
-#> nhefs$wt82_71
-#> n missing distinct Info Mean Gmd .05 .10
-#> 1566 63 1510 1 2.638 8.337 -9.752 -6.292
-#> .25 .50 .75 .90 .95
-#> -1.478 2.604 6.690 11.117 14.739
-#>
-#> lowest : -41.2805 -30.5019 -30.0501 -29.0258 -25.9706
-#> highest: 34.0178 36.9693 37.6505 47.5113 48.5384
-
-# estimation of denominator of ip weights for C
-cw.denom <- glm(cens==0 ~ qsmk + sex + race + age + I(age^2)
- + as.factor(education) + smokeintensity + I(smokeintensity^2)
- + smokeyrs + I(smokeyrs^2) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71^2),
- data = nhefs, family = binomial("logit"))
-summary(cw.denom)
-#>
-#> Call:
-#> glm(formula = cens == 0 ~ qsmk + sex + race + age + I(age^2) +
-#> as.factor(education) + smokeintensity + I(smokeintensity^2) +
-#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71^2), family = binomial("logit"), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -4.0144661 2.5761058 -1.558 0.11915
-#> qsmk -0.5168674 0.2877162 -1.796 0.07242 .
-#> sex -0.0573131 0.3302775 -0.174 0.86223
-#> race 0.0122715 0.4524887 0.027 0.97836
-#> age 0.2697293 0.1174647 2.296 0.02166 *
-#> I(age^2) -0.0028837 0.0011135 -2.590 0.00961 **
-#> as.factor(education)2 0.4407884 0.4193993 1.051 0.29326
-#> as.factor(education)3 0.1646881 0.3705471 0.444 0.65672
-#> as.factor(education)4 -0.1384470 0.5697969 -0.243 0.80802
-#> as.factor(education)5 0.3823818 0.5601808 0.683 0.49486
-#> smokeintensity -0.0157119 0.0347319 -0.452 0.65100
-#> I(smokeintensity^2) 0.0001133 0.0006058 0.187 0.85171
-#> smokeyrs -0.0785973 0.0749576 -1.049 0.29438
-#> I(smokeyrs^2) 0.0005569 0.0010318 0.540 0.58938
-#> as.factor(exercise)1 0.9714714 0.3878101 2.505 0.01224 *
-#> as.factor(exercise)2 0.5839890 0.3723133 1.569 0.11675
-#> as.factor(active)1 0.2474785 0.3254548 0.760 0.44701
-#> as.factor(active)2 -0.7065829 0.3964577 -1.782 0.07471 .
-#> wt71 0.0878871 0.0400115 2.197 0.02805 *
-#> I(wt71^2) -0.0006351 0.0002257 -2.813 0.00490 **
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 533.36 on 1628 degrees of freedom
-#> Residual deviance: 465.36 on 1609 degrees of freedom
-#> AIC: 505.36
-#>
-#> Number of Fisher Scoring iterations: 7
-nhefs$pd.c <- predict(cw.denom, nhefs, type="response")
-nhefs$wc <- ifelse(nhefs$cens==0, 1/nhefs$pd.c, NA)
-# observations with cens=1 only contribute to censoring models
# install.packages("readxl") # install package if required
+library("readxl")
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+
+# some processing of the data
+nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
+
+# ranking of extreme observations
+#install.packages("Hmisc")
+library(Hmisc)
+#>
+#> Attaching package: 'Hmisc'
+#> The following objects are masked from 'package:base':
+#>
+#> format.pval, units
describe(nhefs$wt82_71)
+#> nhefs$wt82_71
+#> n missing distinct Info Mean Gmd .05 .10
+#> 1566 63 1510 1 2.638 8.337 -9.752 -6.292
+#> .25 .50 .75 .90 .95
+#> -1.478 2.604 6.690 11.117 14.739
+#>
+#> lowest : -41.2805 -30.5019 -30.0501 -29.0258 -25.9706
+#> highest: 34.0178 36.9693 37.6505 47.5113 48.5384
+# estimation of denominator of ip weights for C
+cw.denom <- glm(cens==0 ~ qsmk + sex + race + age + I(age^2)
+ + as.factor(education) + smokeintensity + I(smokeintensity^2)
+ + smokeyrs + I(smokeyrs^2) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71^2),
+ data = nhefs, family = binomial("logit"))
+summary(cw.denom)
+#>
+#> Call:
+#> glm(formula = cens == 0 ~ qsmk + sex + race + age + I(age^2) +
+#> as.factor(education) + smokeintensity + I(smokeintensity^2) +
+#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71^2), family = binomial("logit"), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -4.0144661 2.5761058 -1.558 0.11915
+#> qsmk -0.5168674 0.2877162 -1.796 0.07242 .
+#> sex -0.0573131 0.3302775 -0.174 0.86223
+#> race 0.0122715 0.4524887 0.027 0.97836
+#> age 0.2697293 0.1174647 2.296 0.02166 *
+#> I(age^2) -0.0028837 0.0011135 -2.590 0.00961 **
+#> as.factor(education)2 0.4407884 0.4193993 1.051 0.29326
+#> as.factor(education)3 0.1646881 0.3705471 0.444 0.65672
+#> as.factor(education)4 -0.1384470 0.5697969 -0.243 0.80802
+#> as.factor(education)5 0.3823818 0.5601808 0.683 0.49486
+#> smokeintensity -0.0157119 0.0347319 -0.452 0.65100
+#> I(smokeintensity^2) 0.0001133 0.0006058 0.187 0.85171
+#> smokeyrs -0.0785973 0.0749576 -1.049 0.29438
+#> I(smokeyrs^2) 0.0005569 0.0010318 0.540 0.58938
+#> as.factor(exercise)1 0.9714714 0.3878101 2.505 0.01224 *
+#> as.factor(exercise)2 0.5839890 0.3723133 1.569 0.11675
+#> as.factor(active)1 0.2474785 0.3254548 0.760 0.44701
+#> as.factor(active)2 -0.7065829 0.3964577 -1.782 0.07471 .
+#> wt71 0.0878871 0.0400115 2.197 0.02805 *
+#> I(wt71^2) -0.0006351 0.0002257 -2.813 0.00490 **
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 533.36 on 1628 degrees of freedom
+#> Residual deviance: 465.36 on 1609 degrees of freedom
+#> AIC: 505.36
+#>
+#> Number of Fisher Scoring iterations: 7
nhefs$pd.c <- predict(cw.denom, nhefs, type="response")
+nhefs$wc <- ifelse(nhefs$cens==0, 1/nhefs$pd.c, NA)
+# observations with cens=1 only contribute to censoring models
Program 14.2
@@ -401,144 +401,144 @@ Program 14.2
G-estimation: Checking one possible value of psi
-#install.packages("geepack")
-library("geepack")
-
-nhefs$psi <- 3.446
-nhefs$Hpsi <- nhefs$wt82_71 - nhefs$psi*nhefs$qsmk
-
-fit <- geeglm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71*wt71) + Hpsi, family=binomial, data=nhefs,
- weights=wc, id=seqn, corstr="independence")
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-summary(fit)
-#>
-#> Call:
-#> geeglm(formula = qsmk ~ sex + race + age + I(age * age) + as.factor(education) +
-#> smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs +
-#> I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71 * wt71) + Hpsi, family = binomial, data = nhefs,
-#> weights = wc, id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) -2.403e+00 1.329e+00 3.269 0.070604 .
-#> sex -5.137e-01 1.536e-01 11.193 0.000821 ***
-#> race -8.609e-01 2.099e-01 16.826 4.10e-05 ***
-#> age 1.152e-01 5.020e-02 5.263 0.021779 *
-#> I(age * age) -7.593e-04 5.296e-04 2.056 0.151619
-#> as.factor(education)2 -2.894e-02 1.964e-01 0.022 0.882859
-#> as.factor(education)3 8.771e-02 1.726e-01 0.258 0.611329
-#> as.factor(education)4 6.637e-02 2.698e-01 0.061 0.805645
-#> as.factor(education)5 4.711e-01 2.247e-01 4.395 0.036036 *
-#> smokeintensity -7.834e-02 1.464e-02 28.635 8.74e-08 ***
-#> I(smokeintensity * smokeintensity) 1.072e-03 2.650e-04 16.368 5.21e-05 ***
-#> smokeyrs -7.111e-02 2.639e-02 7.261 0.007047 **
-#> I(smokeyrs * smokeyrs) 8.153e-04 4.490e-04 3.298 0.069384 .
-#> as.factor(exercise)1 3.363e-01 1.828e-01 3.384 0.065844 .
-#> as.factor(exercise)2 3.800e-01 1.889e-01 4.049 0.044187 *
-#> as.factor(active)1 3.412e-02 1.339e-01 0.065 0.798778
-#> as.factor(active)2 2.135e-01 2.121e-01 1.012 0.314308
-#> wt71 -7.661e-03 2.562e-02 0.089 0.764963
-#> I(wt71 * wt71) 8.655e-05 1.582e-04 0.299 0.584233
-#> Hpsi -1.903e-06 8.839e-03 0.000 0.999828
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 0.9969 0.06717
-#> Number of clusters: 1566 Maximum cluster size: 1
#install.packages("geepack")
+library("geepack")
+
+nhefs$psi <- 3.446
+nhefs$Hpsi <- nhefs$wt82_71 - nhefs$psi*nhefs$qsmk
+
+fit <- geeglm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71*wt71) + Hpsi, family=binomial, data=nhefs,
+ weights=wc, id=seqn, corstr="independence")
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
summary(fit)
+#>
+#> Call:
+#> geeglm(formula = qsmk ~ sex + race + age + I(age * age) + as.factor(education) +
+#> smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs +
+#> I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71 * wt71) + Hpsi, family = binomial, data = nhefs,
+#> weights = wc, id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) -2.403e+00 1.329e+00 3.269 0.070604 .
+#> sex -5.137e-01 1.536e-01 11.193 0.000821 ***
+#> race -8.609e-01 2.099e-01 16.826 4.10e-05 ***
+#> age 1.152e-01 5.020e-02 5.263 0.021779 *
+#> I(age * age) -7.593e-04 5.296e-04 2.056 0.151619
+#> as.factor(education)2 -2.894e-02 1.964e-01 0.022 0.882859
+#> as.factor(education)3 8.771e-02 1.726e-01 0.258 0.611329
+#> as.factor(education)4 6.637e-02 2.698e-01 0.061 0.805645
+#> as.factor(education)5 4.711e-01 2.247e-01 4.395 0.036036 *
+#> smokeintensity -7.834e-02 1.464e-02 28.635 8.74e-08 ***
+#> I(smokeintensity * smokeintensity) 1.072e-03 2.650e-04 16.368 5.21e-05 ***
+#> smokeyrs -7.111e-02 2.639e-02 7.261 0.007047 **
+#> I(smokeyrs * smokeyrs) 8.153e-04 4.490e-04 3.298 0.069384 .
+#> as.factor(exercise)1 3.363e-01 1.828e-01 3.384 0.065844 .
+#> as.factor(exercise)2 3.800e-01 1.889e-01 4.049 0.044187 *
+#> as.factor(active)1 3.412e-02 1.339e-01 0.065 0.798778
+#> as.factor(active)2 2.135e-01 2.121e-01 1.012 0.314308
+#> wt71 -7.661e-03 2.562e-02 0.089 0.764963
+#> I(wt71 * wt71) 8.655e-05 1.582e-04 0.299 0.584233
+#> Hpsi -1.903e-06 8.839e-03 0.000 0.999828
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 0.9969 0.06717
+#> Number of clusters: 1566 Maximum cluster size: 1
G-estimation: Checking multiple possible values of psi
-#install.packages("geepack")
-grid <- seq(from = 2,to = 5, by = 0.1)
-j = 0
-Hpsi.coefs <- cbind(rep(NA,length(grid)), rep(NA, length(grid)))
-colnames(Hpsi.coefs) <- c("Estimate", "p-value")
-
-for (i in grid){
- psi = i
- j = j+1
- nhefs$Hpsi <- nhefs$wt82_71 - psi * nhefs$qsmk
-
- gest.fit <- geeglm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71*wt71) + Hpsi, family=binomial, data=nhefs,
- weights=wc, id=seqn, corstr="independence")
- Hpsi.coefs[j,1] <- summary(gest.fit)$coefficients["Hpsi", "Estimate"]
- Hpsi.coefs[j,2] <- summary(gest.fit)$coefficients["Hpsi", "Pr(>|W|)"]
-}
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-Hpsi.coefs
-#> Estimate p-value
-#> [1,] 0.0267219 0.001772
-#> [2,] 0.0248946 0.003580
-#> [3,] 0.0230655 0.006963
-#> [4,] 0.0212344 0.013026
-#> [5,] 0.0194009 0.023417
-#> [6,] 0.0175647 0.040430
-#> [7,] 0.0157254 0.067015
-#> [8,] 0.0138827 0.106626
-#> [9,] 0.0120362 0.162877
-#> [10,] 0.0101857 0.238979
-#> [11,] 0.0083308 0.337048
-#> [12,] 0.0064713 0.457433
-#> [13,] 0.0046069 0.598235
-#> [14,] 0.0027374 0.755204
-#> [15,] 0.0008624 0.922101
-#> [16,] -0.0010181 0.908537
-#> [17,] -0.0029044 0.744362
-#> [18,] -0.0047967 0.592188
-#> [19,] -0.0066950 0.457169
-#> [20,] -0.0085997 0.342360
-#> [21,] -0.0105107 0.248681
-#> [22,] -0.0124282 0.175239
-#> [23,] -0.0143523 0.119841
-#> [24,] -0.0162831 0.079580
-#> [25,] -0.0182206 0.051347
-#> [26,] -0.0201649 0.032218
-#> [27,] -0.0221160 0.019675
-#> [28,] -0.0240740 0.011706
-#> [29,] -0.0260389 0.006792
-#> [30,] -0.0280106 0.003847
-#> [31,] -0.0299893 0.002129
#install.packages("geepack")
+grid <- seq(from = 2,to = 5, by = 0.1)
+j = 0
+Hpsi.coefs <- cbind(rep(NA,length(grid)), rep(NA, length(grid)))
+colnames(Hpsi.coefs) <- c("Estimate", "p-value")
+
+for (i in grid){
+ psi = i
+ j = j+1
+ nhefs$Hpsi <- nhefs$wt82_71 - psi * nhefs$qsmk
+
+ gest.fit <- geeglm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71*wt71) + Hpsi, family=binomial, data=nhefs,
+ weights=wc, id=seqn, corstr="independence")
+ Hpsi.coefs[j,1] <- summary(gest.fit)$coefficients["Hpsi", "Estimate"]
+ Hpsi.coefs[j,2] <- summary(gest.fit)$coefficients["Hpsi", "Pr(>|W|)"]
+}
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
Hpsi.coefs
+#> Estimate p-value
+#> [1,] 0.0267219 0.001772
+#> [2,] 0.0248946 0.003580
+#> [3,] 0.0230655 0.006963
+#> [4,] 0.0212344 0.013026
+#> [5,] 0.0194009 0.023417
+#> [6,] 0.0175647 0.040430
+#> [7,] 0.0157254 0.067015
+#> [8,] 0.0138827 0.106626
+#> [9,] 0.0120362 0.162877
+#> [10,] 0.0101857 0.238979
+#> [11,] 0.0083308 0.337048
+#> [12,] 0.0064713 0.457433
+#> [13,] 0.0046069 0.598235
+#> [14,] 0.0027374 0.755204
+#> [15,] 0.0008624 0.922101
+#> [16,] -0.0010181 0.908537
+#> [17,] -0.0029044 0.744362
+#> [18,] -0.0047967 0.592188
+#> [19,] -0.0066950 0.457169
+#> [20,] -0.0085997 0.342360
+#> [21,] -0.0105107 0.248681
+#> [22,] -0.0124282 0.175239
+#> [23,] -0.0143523 0.119841
+#> [24,] -0.0162831 0.079580
+#> [25,] -0.0182206 0.051347
+#> [26,] -0.0201649 0.032218
+#> [27,] -0.0221160 0.019675
+#> [28,] -0.0240740 0.011706
+#> [29,] -0.0260389 0.006792
+#> [30,] -0.0280106 0.003847
+#> [31,] -0.0299893 0.002129
Program 14.3
G-estimation: Closed form estimator linear mean models
-logit.est <- glm(qsmk ~ sex + race + age + I(age^2) + as.factor(education)
- + smokeintensity + I(smokeintensity^2) + smokeyrs
- + I(smokeyrs^2) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71^2), data = nhefs, weight = wc,
- family = binomial())
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-summary(logit.est)
-#>
-#> Call:
-#> glm(formula = qsmk ~ sex + race + age + I(age^2) + as.factor(education) +
-#> smokeintensity + I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) +
-#> as.factor(exercise) + as.factor(active) + wt71 + I(wt71^2),
-#> family = binomial(), data = nhefs, weights = wc)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -2.40e+00 1.31e+00 -1.83 0.06743 .
-#> sex -5.14e-01 1.50e-01 -3.42 0.00062 ***
-#> race -8.61e-01 2.06e-01 -4.18 2.9e-05 ***
-#> age 1.15e-01 4.95e-02 2.33 0.01992 *
-#> I(age^2) -7.59e-04 5.14e-04 -1.48 0.13953
-#> as.factor(education)2 -2.89e-02 1.93e-01 -0.15 0.88079
-#> as.factor(education)3 8.77e-02 1.73e-01 0.51 0.61244
-#> as.factor(education)4 6.64e-02 2.66e-01 0.25 0.80301
-#> as.factor(education)5 4.71e-01 2.21e-01 2.13 0.03314 *
-#> smokeintensity -7.83e-02 1.49e-02 -5.27 1.4e-07 ***
-#> I(smokeintensity^2) 1.07e-03 2.78e-04 3.85 0.00012 ***
-#> smokeyrs -7.11e-02 2.71e-02 -2.63 0.00862 **
-#> I(smokeyrs^2) 8.15e-04 4.45e-04 1.83 0.06722 .
-#> as.factor(exercise)1 3.36e-01 1.75e-01 1.92 0.05467 .
-#> as.factor(exercise)2 3.80e-01 1.82e-01 2.09 0.03637 *
-#> as.factor(active)1 3.41e-02 1.30e-01 0.26 0.79337
-#> as.factor(active)2 2.13e-01 2.06e-01 1.04 0.30033
-#> wt71 -7.66e-03 2.46e-02 -0.31 0.75530
-#> I(wt71^2) 8.66e-05 1.51e-04 0.57 0.56586
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1872.2 on 1565 degrees of freedom
-#> Residual deviance: 1755.6 on 1547 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 1719
-#>
-#> Number of Fisher Scoring iterations: 4
-nhefs$pqsmk <- predict(logit.est, nhefs, type = "response")
-describe(nhefs$pqsmk)
-#> nhefs$pqsmk
-#> n missing distinct Info Mean Gmd .05 .10
-#> 1629 0 1629 1 0.2622 0.1302 0.1015 0.1261
-#> .25 .50 .75 .90 .95
-#> 0.1780 0.2426 0.3251 0.4221 0.4965
-#>
-#> lowest : 0.0514466 0.0515703 0.0543802 0.0558308 0.0593059
-#> highest: 0.672083 0.686432 0.713913 0.733299 0.78914
-summary(nhefs$pqsmk)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.0514 0.1780 0.2426 0.2622 0.3251 0.7891
-
-# solve sum(w_c * H(psi) * (qsmk - E[qsmk | L])) = 0
-# for a single psi and H(psi) = wt82_71 - psi * qsmk
-# this can be solved as
-# psi = sum( w_c * wt82_71 * (qsmk - pqsmk)) / sum(w_c * qsmk * (qsmk - pqsmk))
-
-nhefs.c <- nhefs[which(!is.na(nhefs$wt82)),]
-with(nhefs.c, sum(wc*wt82_71*(qsmk-pqsmk)) / sum(wc*qsmk*(qsmk - pqsmk)))
-#> [1] 3.446
logit.est <- glm(qsmk ~ sex + race + age + I(age^2) + as.factor(education)
+ + smokeintensity + I(smokeintensity^2) + smokeyrs
+ + I(smokeyrs^2) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71^2), data = nhefs, weight = wc,
+ family = binomial())
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
summary(logit.est)
+#>
+#> Call:
+#> glm(formula = qsmk ~ sex + race + age + I(age^2) + as.factor(education) +
+#> smokeintensity + I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) +
+#> as.factor(exercise) + as.factor(active) + wt71 + I(wt71^2),
+#> family = binomial(), data = nhefs, weights = wc)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -2.40e+00 1.31e+00 -1.83 0.06743 .
+#> sex -5.14e-01 1.50e-01 -3.42 0.00062 ***
+#> race -8.61e-01 2.06e-01 -4.18 2.9e-05 ***
+#> age 1.15e-01 4.95e-02 2.33 0.01992 *
+#> I(age^2) -7.59e-04 5.14e-04 -1.48 0.13953
+#> as.factor(education)2 -2.89e-02 1.93e-01 -0.15 0.88079
+#> as.factor(education)3 8.77e-02 1.73e-01 0.51 0.61244
+#> as.factor(education)4 6.64e-02 2.66e-01 0.25 0.80301
+#> as.factor(education)5 4.71e-01 2.21e-01 2.13 0.03314 *
+#> smokeintensity -7.83e-02 1.49e-02 -5.27 1.4e-07 ***
+#> I(smokeintensity^2) 1.07e-03 2.78e-04 3.85 0.00012 ***
+#> smokeyrs -7.11e-02 2.71e-02 -2.63 0.00862 **
+#> I(smokeyrs^2) 8.15e-04 4.45e-04 1.83 0.06722 .
+#> as.factor(exercise)1 3.36e-01 1.75e-01 1.92 0.05467 .
+#> as.factor(exercise)2 3.80e-01 1.82e-01 2.09 0.03637 *
+#> as.factor(active)1 3.41e-02 1.30e-01 0.26 0.79337
+#> as.factor(active)2 2.13e-01 2.06e-01 1.04 0.30033
+#> wt71 -7.66e-03 2.46e-02 -0.31 0.75530
+#> I(wt71^2) 8.66e-05 1.51e-04 0.57 0.56586
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1872.2 on 1565 degrees of freedom
+#> Residual deviance: 1755.6 on 1547 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 1719
+#>
+#> Number of Fisher Scoring iterations: 4
nhefs$pqsmk <- predict(logit.est, nhefs, type = "response")
+describe(nhefs$pqsmk)
+#> nhefs$pqsmk
+#> n missing distinct Info Mean Gmd .05 .10
+#> 1629 0 1629 1 0.2622 0.1302 0.1015 0.1261
+#> .25 .50 .75 .90 .95
+#> 0.1780 0.2426 0.3251 0.4221 0.4965
+#>
+#> lowest : 0.0514466 0.0515703 0.0543802 0.0558308 0.0593059
+#> highest: 0.672083 0.686432 0.713913 0.733299 0.78914
summary(nhefs$pqsmk)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.0514 0.1780 0.2426 0.2622 0.3251 0.7891
+# solve sum(w_c * H(psi) * (qsmk - E[qsmk | L])) = 0
+# for a single psi and H(psi) = wt82_71 - psi * qsmk
+# this can be solved as
+# psi = sum( w_c * wt82_71 * (qsmk - pqsmk)) / sum(w_c * qsmk * (qsmk - pqsmk))
+
+nhefs.c <- nhefs[which(!is.na(nhefs$wt82)),]
+with(nhefs.c, sum(wc*wt82_71*(qsmk-pqsmk)) / sum(wc*qsmk*(qsmk - pqsmk)))
+#> [1] 3.446
G-estimation: Closed form estimator for 2-parameter model
-diff = with(nhefs.c, qsmk - pqsmk)
-diff2 = with(nhefs.c, wc * diff)
-
-lhs = matrix(0,2,2)
-lhs[1,1] = with(nhefs.c, sum(qsmk * diff2))
-lhs[1,2] = with(nhefs.c, sum(qsmk * smokeintensity * diff2))
-lhs[2,1] = with(nhefs.c, sum(qsmk * smokeintensity * diff2))
-lhs[2,2] = with(nhefs.c, sum(qsmk * smokeintensity * smokeintensity * diff2))
-
-rhs = matrix(0,2,1)
-rhs[1] = with(nhefs.c, sum(wt82_71 * diff2))
-rhs[2] = with(nhefs.c, sum(wt82_71 * smokeintensity * diff2))
-
-psi = t(solve(lhs,rhs))
-psi
-#> [,1] [,2]
-#> [1,] 2.859 0.03004
diff = with(nhefs.c, qsmk - pqsmk)
+diff2 = with(nhefs.c, wc * diff)
+
+lhs = matrix(0,2,2)
+lhs[1,1] = with(nhefs.c, sum(qsmk * diff2))
+lhs[1,2] = with(nhefs.c, sum(qsmk * smokeintensity * diff2))
+lhs[2,1] = with(nhefs.c, sum(qsmk * smokeintensity * diff2))
+lhs[2,2] = with(nhefs.c, sum(qsmk * smokeintensity * smokeintensity * diff2))
+
+rhs = matrix(0,2,1)
+rhs[1] = with(nhefs.c, sum(wt82_71 * diff2))
+rhs[2] = with(nhefs.c, sum(wt82_71 * smokeintensity * diff2))
+
+psi = t(solve(lhs,rhs))
+psi
+#> [,1] [,2]
+#> [1,] 2.859 0.03004
Causal Inference: What If. R and Stata code for Exercises
-Preface
diff --git a/docs/index.md b/docs/index.md
index a38dab9..d2a1cd1 100644
--- a/docs/index.md
+++ b/docs/index.md
@@ -5,7 +5,7 @@ author:
- R code by Joy Shi and Sean McGrath
- Stata code by Eleanor Murray and Roger Logan
- R Markdown code by Tom Palmer
-date: "25 April 2024"
+date: "16 June 2024"
site: bookdown::bookdown_site
documentclass: book
#biblio-style: apalike
@@ -52,7 +52,7 @@ Either,
## Installing dependency packages
It is easiest to open the repo in RStudio, as an RStudio project, by doubling click the `.Rproj` file. This makes sure that R's working directory is at the top level of the repo. If you don't want to open the repo as a project set the working directory to the top level of the repo directories using `setwd()`. Then run:
-```r
+``` r
# install.packages("devtools") # uncomment if devtools not installed
devtools::install_dev_deps()
```
@@ -61,12 +61,12 @@ devtools::install_dev_deps()
We assume that you have downloaded the data from the Causal Inference Book website and saved it to a `data` subdirectory. You can do this manually or with the following code (nb. we use the [`here`](https://here.r-lib.org/) package to reference the data subdirectory).
-```r
+``` r
library(here)
```
-```r
+``` r
dataurls <- list()
stub <- "https://cdn1.sph.harvard.edu/wp-content/uploads/sites/1268/"
dataurls[[1]] <- paste0(stub, "2012/10/nhefs_sas.zip")
diff --git a/docs/instrumental-variables-estimation-stata.html b/docs/instrumental-variables-estimation-stata.html
index cda2238..810f0d9 100644
--- a/docs/instrumental-variables-estimation-stata.html
+++ b/docs/instrumental-variables-estimation-stata.html
@@ -26,7 +26,7 @@
-
+
@@ -310,7 +310,7 @@
16. Instrumental variables estimation: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -324,68 +324,68 @@
Program 16.1
use ./data/nhefs-formatted, clear
-
-summarize price82
-
-/* ignore subjects with missing outcome or missing instrument for simplicity*/
-foreach var of varlist wt82 price82 {
- drop if `var'==.
-}
-
-/*Create categorical instrument*/
-gen byte highprice = (price82 > 1.5 & price82 < .)
-
-save ./data/nhefs-highprice, replace
-
-/*Calculate P[Z|A=a]*/
-tab highprice qsmk, row
-
-/*Calculate P[Y|Z=z]*/
-ttest wt82_71, by(highprice)
-
-/*Final IV estimate, OPTION 1: Hand calculations*/
-/*Numerator: num = E[Y|Z=1] - E[Y|Z=0] = 2.686 - 2.536 = 0.150*/
-/*Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0] = 0.258 - 0.195 = 0.063 */
-/*IV estimator: E[Ya=1] - E[Ya=0] =
-(E[Y|Z=1]-E[Y|Z=0])/(P[A=1|Z=1]-P[A=1|Z=0]) = 0.150/0.063 = 2.397*/
-display "Numerator, E[Y|Z=1] - E[Y|Z=0] =", 2.686 - 2.536
-display "Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0] =", 0.258 - 0.195
-display "IV estimator =", 0.150/0.063
-
-/*OPTION 2 2: automated calculation of instrument*/
-/*Calculate P[A=1|Z=z], for each value of the instrument,
-and store in a matrix*/
-quietly summarize qsmk if (highprice==0)
-matrix input pa = (`r(mean)')
-quietly summarize qsmk if (highprice==1)
-matrix pa = (pa ,`r(mean)')
-matrix list pa
-
-/*Calculate P[Y|Z=z], for each value of the instrument,
-and store in a second matrix*/
-quietly summarize wt82_71 if (highprice==0)
-matrix input ey = (`r(mean)')
-quietly summarize wt82_71 if (highprice==1)
-matrix ey = (ey ,`r(mean)')
-matrix list ey
-
-/*Using Stata's built-in matrix manipulation feature (Mata),
-calculate numerator, denominator and IV estimator*/
-*Numerator: num = E[Y|Z=1] - E[Y|Z=0]*mata
-*Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0]*
-*IV estimator: iv_est = IV estimate of E[Ya=1] - E[Ya=0] *
-mata
-pa = st_matrix("pa")
-ey = st_matrix("ey")
-num = ey[1,2] - ey[1,1]
-denom = pa[1,2] - pa[1,1]
-iv_est = num / denom
-num
-denom
-st_numscalar("iv_est", iv_est)
-end
-di scalar(iv_est)
use ./data/nhefs-formatted, clear
+
+summarize price82
+
+/* ignore subjects with missing outcome or missing instrument for simplicity*/
+foreach var of varlist wt82 price82 {
+ drop if `var'==.
+}
+
+/*Create categorical instrument*/
+gen byte highprice = (price82 > 1.5 & price82 < .)
+
+save ./data/nhefs-highprice, replace
+
+/*Calculate P[Z|A=a]*/
+tab highprice qsmk, row
+
+/*Calculate P[Y|Z=z]*/
+ttest wt82_71, by(highprice)
+
+/*Final IV estimate, OPTION 1: Hand calculations*/
+/*Numerator: num = E[Y|Z=1] - E[Y|Z=0] = 2.686 - 2.536 = 0.150*/
+/*Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0] = 0.258 - 0.195 = 0.063 */
+/*IV estimator: E[Ya=1] - E[Ya=0] =
+(E[Y|Z=1]-E[Y|Z=0])/(P[A=1|Z=1]-P[A=1|Z=0]) = 0.150/0.063 = 2.397*/
+display "Numerator, E[Y|Z=1] - E[Y|Z=0] =", 2.686 - 2.536
+display "Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0] =", 0.258 - 0.195
+display "IV estimator =", 0.150/0.063
+
+/*OPTION 2 2: automated calculation of instrument*/
+/*Calculate P[A=1|Z=z], for each value of the instrument,
+and store in a matrix*/
+quietly summarize qsmk if (highprice==0)
+matrix input pa = (`r(mean)')
+quietly summarize qsmk if (highprice==1)
+matrix pa = (pa ,`r(mean)')
+matrix list pa
+
+/*Calculate P[Y|Z=z], for each value of the instrument,
+and store in a second matrix*/
+quietly summarize wt82_71 if (highprice==0)
+matrix input ey = (`r(mean)')
+quietly summarize wt82_71 if (highprice==1)
+matrix ey = (ey ,`r(mean)')
+matrix list ey
+
+/*Using Stata's built-in matrix manipulation feature (Mata),
+calculate numerator, denominator and IV estimator*/
+*Numerator: num = E[Y|Z=1] - E[Y|Z=0]*mata
+*Denominator: denom = P[A=1|Z=1] - P[A=1|Z=0]*
+*IV estimator: iv_est = IV estimate of E[Ya=1] - E[Ya=0] *
+mata
+pa = st_matrix("pa")
+ey = st_matrix("ey")
+num = ey[1,2] - ey[1,1]
+denom = pa[1,2] - pa[1,1]
+iv_est = num / denom
+num
+denom
+st_numscalar("iv_est", iv_est)
+end
+di scalar(iv_est)
Variable | Obs Mean Std. dev. Min Max
-------------+---------------------------------------------------------
price82 | 1,476 1.805989 .1301703 1.451904 2.103027
@@ -490,12 +490,12 @@
Program 16.2
use ./data/nhefs-highprice, clear
-
-/* ivregress fits the model in two stages:
-- first model: qsmk = highprice
-- second model: wt82_71 = predicted_qsmk */
-ivregress 2sls wt82_71 (qsmk = highprice)
use ./data/nhefs-highprice, clear
+
+/* ivregress fits the model in two stages:
+- first model: qsmk = highprice
+- second model: wt82_71 = predicted_qsmk */
+ivregress 2sls wt82_71 (qsmk = highprice)
Instrumental variables 2SLS regression Number of obs = 1,476
Wald chi2(1) = 0.01
Prob > chi2 = 0.9038
@@ -521,12 +521,12 @@
Program 16.3
+use ./data/nhefs-highprice, clear
-
-gen psi = 2.396
-gen hspi = wt82_71 - psi*qsmk
-
-logit highprice hspi
use ./data/nhefs-highprice, clear
+
+gen psi = 2.396
+gen hspi = wt82_71 - psi*qsmk
+
+logit highprice hspi
Iteration 0: Log likelihood = -187.34948
Iteration 1: Log likelihood = -187.34948
@@ -549,31 +549,31 @@
Program 16.4
+use ./data/nhefs-highprice, clear
-
-/*Instrument cut-point: 1.6*/
-replace highprice = .
-replace highprice = (price82 >1.6 & price82 < .)
-
-ivregress 2sls wt82_71 (qsmk = highprice)
-
-/*Instrument cut-point: 1.7*/
-replace highprice = .
-replace highprice = (price82 >1.7 & price82 < .)
-
-ivregress 2sls wt82_71 (qsmk = highprice)
-
-/*Instrument cut-point: 1.8*/
-replace highprice = .
-replace highprice = (price82 >1.8 & price82 < .)
-
-ivregress 2sls wt82_71 (qsmk = highprice)
-
-/*Instrument cut-point: 1.9*/
-replace highprice = .
-replace highprice = (price82 >1.9 & price82 < .)
-
-ivregress 2sls wt82_71 (qsmk = highprice)
use ./data/nhefs-highprice, clear
+
+/*Instrument cut-point: 1.6*/
+replace highprice = .
+replace highprice = (price82 >1.6 & price82 < .)
+
+ivregress 2sls wt82_71 (qsmk = highprice)
+
+/*Instrument cut-point: 1.7*/
+replace highprice = .
+replace highprice = (price82 >1.7 & price82 < .)
+
+ivregress 2sls wt82_71 (qsmk = highprice)
+
+/*Instrument cut-point: 1.8*/
+replace highprice = .
+replace highprice = (price82 >1.8 & price82 < .)
+
+ivregress 2sls wt82_71 (qsmk = highprice)
+
+/*Instrument cut-point: 1.9*/
+replace highprice = .
+replace highprice = (price82 >1.9 & price82 < .)
+
+ivregress 2sls wt82_71 (qsmk = highprice)
(1,476 real changes made, 1,476 to missing)
(1,476 real changes made)
@@ -661,14 +661,14 @@
Program 16.5
+use ./data/nhefs-highprice, clear
-
-replace highprice = .
-replace highprice = (price82 >1.5 & price82 < .)
-
-ivregress 2sls wt82_71 sex race c.age c.smokeintensity ///
- c.smokeyrs i.exercise i.active c.wt7 ///
- (qsmk = highprice)
use ./data/nhefs-highprice, clear
+
+replace highprice = .
+replace highprice = (price82 >1.5 & price82 < .)
+
+ivregress 2sls wt82_71 sex race c.age c.smokeintensity ///
+ c.smokeyrs i.exercise i.active c.wt7 ///
+ (qsmk = highprice)
(1,476 real changes made, 1,476 to missing)
(1,476 real changes made)
diff --git a/docs/instrumental-variables-estimation.html b/docs/instrumental-variables-estimation.html
index 4a637c8..555a9d5 100644
--- a/docs/instrumental-variables-estimation.html
+++ b/docs/instrumental-variables-estimation.html
@@ -26,7 +26,7 @@
-
+
@@ -316,39 +316,39 @@
Program 16.1Estimating the average causal using the standard IV estimator via the calculation of sample averages
#install.packages("readxl") # install package if required
-library("readxl")
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-
-# some preprocessing of the data
-nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
-summary(nhefs$price82)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
-#> 1.452 1.740 1.815 1.806 1.868 2.103 92
-
-# for simplicity, ignore subjects with missing outcome or missing instrument
-nhefs.iv <- nhefs[which(!is.na(nhefs$wt82) & !is.na(nhefs$price82)),]
-nhefs.iv$highprice <- ifelse(nhefs.iv$price82>=1.5, 1, 0)
-
-table(nhefs.iv$highprice, nhefs.iv$qsmk)
-#>
-#> 0 1
-#> 0 33 8
-#> 1 1065 370
-
-t.test(wt82_71 ~ highprice, data=nhefs.iv)
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by highprice
-#> t = -0.10179, df = 41.644, p-value = 0.9194
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -3.130588 2.830010
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 2.535729 2.686018
#install.packages("readxl") # install package if required
+library("readxl")
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+
+# some preprocessing of the data
+nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
+summary(nhefs$price82)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
+#> 1.452 1.740 1.815 1.806 1.868 2.103 92
+# for simplicity, ignore subjects with missing outcome or missing instrument
+nhefs.iv <- nhefs[which(!is.na(nhefs$wt82) & !is.na(nhefs$price82)),]
+nhefs.iv$highprice <- ifelse(nhefs.iv$price82>=1.5, 1, 0)
+
+table(nhefs.iv$highprice, nhefs.iv$qsmk)
+#>
+#> 0 1
+#> 0 33 8
+#> 1 1065 370
+t.test(wt82_71 ~ highprice, data=nhefs.iv)
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by highprice
+#> t = -0.10179, df = 41.644, p-value = 0.9194
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -3.130588 2.830010
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 2.535729 2.686018
Program 16.2
@@ -356,31 +356,31 @@ Program 16.2Estimating the average causal effect using the standard IV estimator via two-stage-least-squares regression
#install.packages ("sem") # install package if required
-library(sem)
-
-model1 <- tsls(wt82_71 ~ qsmk, ~ highprice, data = nhefs.iv)
-summary(model1)
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk
-#>
-#> Instruments: ~highprice
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -43.34863 -4.00206 -0.02712 0.00000 4.17040 46.47022
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 2.068164 5.085098 0.40671 0.68428
-#> qsmk 2.396270 19.840037 0.12078 0.90388
-#>
-#> Residual standard error: 7.8561141 on 1474 degrees of freedom
-confint(model1) # note the wide confidence intervals
-#> 2.5 % 97.5 %
-#> (Intercept) -7.898445 12.03477
-#> qsmk -36.489487 41.28203
#install.packages ("sem") # install package if required
+library(sem)
+
+model1 <- tsls(wt82_71 ~ qsmk, ~ highprice, data = nhefs.iv)
+summary(model1)
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk
+#>
+#> Instruments: ~highprice
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -43.34863 -4.00206 -0.02712 0.00000 4.17040 46.47022
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 2.068164 5.085098 0.40671 0.68428
+#> qsmk 2.396270 19.840037 0.12078 0.90388
+#>
+#> Residual standard error: 7.8561141 on 1474 degrees of freedom
Program 16.3
@@ -390,41 +390,41 @@ Program 16.3G-estimation: Checking one possible value of psi
nhefs.iv$psi <- 2.396
-nhefs.iv$Hpsi <- nhefs.iv$wt82_71-nhefs.iv$psi*nhefs.iv$qsmk
-
-#install.packages("geepack") # install package if required
-library("geepack")
-g.est <- geeglm(highprice ~ Hpsi, data=nhefs.iv, id=seqn, family=binomial(),
- corstr="independence")
-summary(g.est)
-#>
-#> Call:
-#> geeglm(formula = highprice ~ Hpsi, family = binomial(), data = nhefs.iv,
-#> id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 3.555e+00 1.652e-01 463.1 <2e-16 ***
-#> Hpsi 2.748e-07 2.273e-02 0.0 1
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 1 0.7607
-#> Number of clusters: 1476 Maximum cluster size: 1
-
-beta <- coef(g.est)
-SE <- coef(summary(g.est))[,2]
-lcl <- beta-qnorm(0.975)*SE
-ucl <- beta+qnorm(0.975)*SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 3.555e+00 3.23152 3.87917
-#> Hpsi 2.748e-07 -0.04456 0.04456
nhefs.iv$psi <- 2.396
+nhefs.iv$Hpsi <- nhefs.iv$wt82_71-nhefs.iv$psi*nhefs.iv$qsmk
+
+#install.packages("geepack") # install package if required
+library("geepack")
+g.est <- geeglm(highprice ~ Hpsi, data=nhefs.iv, id=seqn, family=binomial(),
+ corstr="independence")
+summary(g.est)
+#>
+#> Call:
+#> geeglm(formula = highprice ~ Hpsi, family = binomial(), data = nhefs.iv,
+#> id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 3.555e+00 1.652e-01 463.1 <2e-16 ***
+#> Hpsi 2.748e-07 2.273e-02 0.0 1
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 1 0.7607
+#> Number of clusters: 1476 Maximum cluster size: 1
Program 16.4
@@ -432,74 +432,74 @@ Program 16.4Estimating the average causal using the standard IV estimator with altnerative proposed instruments
summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.6, 1, 0), data = nhefs.iv))
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk
-#>
-#> Instruments: ~ifelse(price82 >= 1.6, 1, 0)
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -55.6 -13.5 7.6 0.0 12.5 56.4
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -7.89 42.25 -0.187 0.852
-#> qsmk 41.28 164.95 0.250 0.802
-#>
-#> Residual standard error: 18.6055 on 1474 degrees of freedom
-summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.7, 1, 0), data = nhefs.iv))
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk
-#>
-#> Instruments: ~ifelse(price82 >= 1.7, 1, 0)
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -54.4 -13.4 -8.4 0.0 18.1 75.3
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 13.16 48.08 0.274 0.784
-#> qsmk -40.91 187.74 -0.218 0.828
-#>
-#> Residual standard error: 20.591 on 1474 degrees of freedom
-summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.8, 1, 0), data = nhefs.iv))
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk
-#>
-#> Instruments: ~ifelse(price82 >= 1.8, 1, 0)
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -49.37 -8.31 -3.44 0.00 7.27 60.53
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 8.086 7.288 1.110 0.267
-#> qsmk -21.103 28.428 -0.742 0.458
-#>
-#> Residual standard error: 13.0188 on 1474 degrees of freedom
-summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.9, 1, 0), data = nhefs.iv))
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk
-#>
-#> Instruments: ~ifelse(price82 >= 1.9, 1, 0)
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -47.24 -6.33 -1.43 0.00 5.52 54.36
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 5.963 6.067 0.983 0.326
-#> qsmk -12.811 23.667 -0.541 0.588
-#>
-#> Residual standard error: 10.3637 on 1474 degrees of freedom
summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.6, 1, 0), data = nhefs.iv))
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk
+#>
+#> Instruments: ~ifelse(price82 >= 1.6, 1, 0)
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -55.6 -13.5 7.6 0.0 12.5 56.4
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -7.89 42.25 -0.187 0.852
+#> qsmk 41.28 164.95 0.250 0.802
+#>
+#> Residual standard error: 18.6055 on 1474 degrees of freedom
summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.7, 1, 0), data = nhefs.iv))
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk
+#>
+#> Instruments: ~ifelse(price82 >= 1.7, 1, 0)
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -54.4 -13.4 -8.4 0.0 18.1 75.3
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 13.16 48.08 0.274 0.784
+#> qsmk -40.91 187.74 -0.218 0.828
+#>
+#> Residual standard error: 20.591 on 1474 degrees of freedom
summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.8, 1, 0), data = nhefs.iv))
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk
+#>
+#> Instruments: ~ifelse(price82 >= 1.8, 1, 0)
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -49.37 -8.31 -3.44 0.00 7.27 60.53
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 8.086 7.288 1.110 0.267
+#> qsmk -21.103 28.428 -0.742 0.458
+#>
+#> Residual standard error: 13.0188 on 1474 degrees of freedom
summary(tsls(wt82_71 ~ qsmk, ~ ifelse(price82 >= 1.9, 1, 0), data = nhefs.iv))
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk
+#>
+#> Instruments: ~ifelse(price82 >= 1.9, 1, 0)
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -47.24 -6.33 -1.43 0.00 5.52 54.36
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 5.963 6.067 0.983 0.326
+#> qsmk -12.811 23.667 -0.541 0.588
+#>
+#> Residual standard error: 10.3637 on 1474 degrees of freedom
Program 16.5
@@ -508,41 +508,41 @@ Program 16.5Conditional on baseline covariates
model2 <- tsls(wt82_71 ~ qsmk + sex + race + age + smokeintensity + smokeyrs +
- as.factor(exercise) + as.factor(active) + wt71,
- ~ highprice + sex + race + age + smokeintensity + smokeyrs + as.factor(exercise) +
- as.factor(active) + wt71, data = nhefs.iv)
-summary(model2)
-#>
-#> 2SLS Estimates
-#>
-#> Model Formula: wt82_71 ~ qsmk + sex + race + age + smokeintensity + smokeyrs +
-#> as.factor(exercise) + as.factor(active) + wt71
-#>
-#> Instruments: ~highprice + sex + race + age + smokeintensity + smokeyrs + as.factor(exercise) +
-#> as.factor(active) + wt71
-#>
-#> Residuals:
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -42.23 -4.29 -0.62 0.00 3.87 46.74
-#>
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 17.280330 2.335402 7.399 2.3e-13 ***
-#> qsmk -1.042295 29.987369 -0.035 0.9723
-#> sex -1.644393 2.630831 -0.625 0.5320
-#> race -0.183255 4.650386 -0.039 0.9686
-#> age -0.163640 0.240548 -0.680 0.4964
-#> smokeintensity 0.005767 0.145504 0.040 0.9684
-#> smokeyrs 0.025836 0.161421 0.160 0.8729
-#> as.factor(exercise)1 0.498748 2.171239 0.230 0.8184
-#> as.factor(exercise)2 0.581834 2.183148 0.267 0.7899
-#> as.factor(active)1 -1.170145 0.607466 -1.926 0.0543 .
-#> as.factor(active)2 -0.512284 1.308451 -0.392 0.6955
-#> wt71 -0.097949 0.036271 -2.701 0.0070 **
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Residual standard error: 7.7162 on 1464 degrees of freedom
model2 <- tsls(wt82_71 ~ qsmk + sex + race + age + smokeintensity + smokeyrs +
+ as.factor(exercise) + as.factor(active) + wt71,
+ ~ highprice + sex + race + age + smokeintensity + smokeyrs + as.factor(exercise) +
+ as.factor(active) + wt71, data = nhefs.iv)
+summary(model2)
+#>
+#> 2SLS Estimates
+#>
+#> Model Formula: wt82_71 ~ qsmk + sex + race + age + smokeintensity + smokeyrs +
+#> as.factor(exercise) + as.factor(active) + wt71
+#>
+#> Instruments: ~highprice + sex + race + age + smokeintensity + smokeyrs + as.factor(exercise) +
+#> as.factor(active) + wt71
+#>
+#> Residuals:
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -42.23 -4.29 -0.62 0.00 3.87 46.74
+#>
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 17.280330 2.335402 7.399 2.3e-13 ***
+#> qsmk -1.042295 29.987369 -0.035 0.9723
+#> sex -1.644393 2.630831 -0.625 0.5320
+#> race -0.183255 4.650386 -0.039 0.9686
+#> age -0.163640 0.240548 -0.680 0.4964
+#> smokeintensity 0.005767 0.145504 0.040 0.9684
+#> smokeyrs 0.025836 0.161421 0.160 0.8729
+#> as.factor(exercise)1 0.498748 2.171239 0.230 0.8184
+#> as.factor(exercise)2 0.581834 2.183148 0.267 0.7899
+#> as.factor(active)1 -1.170145 0.607466 -1.926 0.0543 .
+#> as.factor(active)2 -0.512284 1.308451 -0.392 0.6955
+#> wt71 -0.097949 0.036271 -2.701 0.0070 **
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Residual standard error: 7.7162 on 1464 degrees of freedom
12. IP Weighting and Marginal Structural Models: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -322,41 +322,41 @@
Program 12.1
use ./data/nhefs, clear
-
-/*Provisionally ignore subjects with missing values for follow-up weight*/
-/*Sample size after exclusion: N = 1566*/
-drop if wt82==.
-
-/* Calculate mean weight change in those with and without smoking cessation*/
-label define qsmk 0 "No smoking cessation" 1 "Smoking cessation"
-label values qsmk qsmk
-by qsmk, sort: egen years = mean(age) if age < .
-label var years "Age, years"
-by qsmk, sort: egen male = mean(100 * (sex==0)) if sex < .
-label var male "Men, %"
-by qsmk, sort: egen white = mean(100 * (race==0)) if race < .
-label var white "White, %"
-by qsmk, sort: egen university = mean(100 * (education == 5)) if education < .
-label var university "University, %"
-by qsmk, sort: egen kg = mean(wt71) if wt71 < .
-label var kg "Weight, kg"
-by qsmk, sort: egen cigs = mean(smokeintensity) if smokeintensity < .
-label var cigs "Cigarettes/day"
-by qsmk, sort: egen meansmkyrs = mean(smokeyrs) if smokeyrs < .
-label var kg "Years smoking"
-by qsmk, sort: egen noexer = mean(100 * (exercise == 2)) if exercise < .
-label var noexer "Little/no exercise"
-by qsmk, sort: egen inactive = mean(100 * (active==2)) if active < .
-label var inactive "Inactive daily life"
-qui save ./data/nhefs-formatted, replace
use ./data/nhefs, clear
+
+/*Provisionally ignore subjects with missing values for follow-up weight*/
+/*Sample size after exclusion: N = 1566*/
+drop if wt82==.
+
+/* Calculate mean weight change in those with and without smoking cessation*/
+label define qsmk 0 "No smoking cessation" 1 "Smoking cessation"
+label values qsmk qsmk
+by qsmk, sort: egen years = mean(age) if age < .
+label var years "Age, years"
+by qsmk, sort: egen male = mean(100 * (sex==0)) if sex < .
+label var male "Men, %"
+by qsmk, sort: egen white = mean(100 * (race==0)) if race < .
+label var white "White, %"
+by qsmk, sort: egen university = mean(100 * (education == 5)) if education < .
+label var university "University, %"
+by qsmk, sort: egen kg = mean(wt71) if wt71 < .
+label var kg "Weight, kg"
+by qsmk, sort: egen cigs = mean(smokeintensity) if smokeintensity < .
+label var cigs "Cigarettes/day"
+by qsmk, sort: egen meansmkyrs = mean(smokeyrs) if smokeyrs < .
+label var kg "Years smoking"
+by qsmk, sort: egen noexer = mean(100 * (exercise == 2)) if exercise < .
+label var noexer "Little/no exercise"
+by qsmk, sort: egen inactive = mean(100 * (active==2)) if active < .
+label var inactive "Inactive daily life"
+qui save ./data/nhefs-formatted, replace
-(63 observations deleted)
use ./data/nhefs-formatted, clear
-
-/*Output table*/
-foreach var of varlist years male white university kg cigs meansmkyrs noexer inactive {
- tabdisp qsmk, cell(`var') format(%3.1f)
-}
use ./data/nhefs-formatted, clear
+
+/*Output table*/
+foreach var of varlist years male white university kg cigs meansmkyrs noexer inactive {
+ tabdisp qsmk, cell(`var') format(%3.1f)
+}
2. tabdisp qsmk, cell(`var') format(%3.1f)
3. }
@@ -438,27 +438,27 @@
Program 12.2
+use ./data/nhefs-formatted, clear
-
-/*Fit a logistic model for the IP weights*/
-logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
-c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
-
-/*Output predicted conditional probability of quitting smoking for each individual*/
-predict p_qsmk, pr
-
-/*Generate nonstabilized weights as P(A=1|covariates) if A = 1 and */
-/* 1-P(A=1|covariates) if A = 0*/
-gen w=.
-replace w=1/p_qsmk if qsmk==1
-replace w=1/(1-p_qsmk) if qsmk==0
-/*Check the mean of the weights; we expect it to be close to 2.0*/
-summarize w
-
-/*Fit marginal structural model in the pseudopopulation*/
-/*Weights assigned using pweight = w*/
-/*Robust standard errors using cluster() option where 'seqn' is the ID variable*/
-regress wt82_71 qsmk [pweight=w], cluster(seqn)
use ./data/nhefs-formatted, clear
+
+/*Fit a logistic model for the IP weights*/
+logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
+c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
+
+/*Output predicted conditional probability of quitting smoking for each individual*/
+predict p_qsmk, pr
+
+/*Generate nonstabilized weights as P(A=1|covariates) if A = 1 and */
+/* 1-P(A=1|covariates) if A = 0*/
+gen w=.
+replace w=1/p_qsmk if qsmk==1
+replace w=1/(1-p_qsmk) if qsmk==0
+/*Check the mean of the weights; we expect it to be close to 2.0*/
+summarize w
+
+/*Fit marginal structural model in the pseudopopulation*/
+/*Weights assigned using pweight = w*/
+/*Robust standard errors using cluster() option where 'seqn' is the ID variable*/
+regress wt82_71 qsmk [pweight=w], cluster(seqn)
Iteration 0: Log likelihood = -893.02712
Iteration 1: Log likelihood = -839.70016
Iteration 2: Log likelihood = -838.45045
@@ -544,37 +544,37 @@
Program 12.3
+use ./data/nhefs-formatted, clear
-
-/*Fit a logistic model for the denominator of the IP weights and predict the */
-/* conditional probability of smoking */
-logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
-c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
-predict pd_qsmk, pr
-
-/*Fit a logistic model for the numerator of ip weights and predict Pr(A=1) */
-logit qsmk
-predict pn_qsmk, pr
-
-/*Generate stabilized weights as f(A)/f(A|L)*/
-gen sw_a=.
-replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
-replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
-
-/*Check distribution of the stabilized weights*/
-summarize sw_a
-
-/*Fit marginal structural model in the pseudopopulation*/
-regress wt82_71 qsmk [pweight=sw_a], cluster(seqn)
-
-/**********************************************************
-FINE POINT 12.2
-Checking positivity
-**********************************************************/
-
-/*Check for missing values within strata of covariates, for example: */
-tab age qsmk if race==0 & sex==1 & wt82!=.
-tab age qsmk if race==1 & sex==1 & wt82!=.
use ./data/nhefs-formatted, clear
+
+/*Fit a logistic model for the denominator of the IP weights and predict the */
+/* conditional probability of smoking */
+logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
+c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
+predict pd_qsmk, pr
+
+/*Fit a logistic model for the numerator of ip weights and predict Pr(A=1) */
+logit qsmk
+predict pn_qsmk, pr
+
+/*Generate stabilized weights as f(A)/f(A|L)*/
+gen sw_a=.
+replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
+replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
+
+/*Check distribution of the stabilized weights*/
+summarize sw_a
+
+/*Fit marginal structural model in the pseudopopulation*/
+regress wt82_71 qsmk [pweight=sw_a], cluster(seqn)
+
+/**********************************************************
+FINE POINT 12.2
+Checking positivity
+**********************************************************/
+
+/*Check for missing values within strata of covariates, for example: */
+tab age qsmk if race==0 & sex==1 & wt82!=.
+tab age qsmk if race==1 & sex==1 & wt82!=.
Iteration 0: Log likelihood = -893.02712
Iteration 1: Log likelihood = -839.70016
Iteration 2: Log likelihood = -838.45045
@@ -775,48 +775,48 @@
Program 12.4
+use ./data/nhefs-formatted, clear
-
-* drop sw_a
-
-/*Analysis restricted to subjects reporting <=25 cig/day at baseline: N = 1162*/
-keep if smokeintensity <=25
-
-/*Fit a linear model for the denominator of the IP weights and calculate the */
-/* mean expected smoking intensity*/
-regress smkintensity82_71 sex race c.age##c.age ib(last).education ///
-c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
-ib(last).exercise ib(last).active c.wt71##c.wt71
-quietly predict p_den
-
-/*Generate the denisty of the denomiator expectation using the mean expected */
-/* smoking intensity and the residuals, assuming a normal distribution*/
-/*Note: The regress command in Stata saves the root mean squared error for the */
-/* immediate regression as e(rmse), thus there is no need to calculate it again. */
-gen dens_den = normalden(smkintensity82_71, p_den, e(rmse))
-
-/*Fit a linear model for the numerator of ip weights, calculate the mean */
-/* expected value, and generate the density*/
-quietly regress smkintensity82_71
-quietly predict p_num
-gen dens_num = normalden( smkintensity82_71, p_num, e(rmse))
-
-/*Generate the final stabilized weights from the estimated numerator and */
-/* denominator, and check the weights distribution*/
-gen sw_a=dens_num/dens_den
-summarize sw_a
-
-/*Fit a marginal structural model in the pseudopopulation*/
-regress wt82_71 c.smkintensity82_71##c.smkintensity82_71 [pweight=sw_a], cluster(seqn)
-
-/*Output the estimated mean Y value when smoke intensity is unchanged from */
-/* baseline to 1982 */
-lincom _b[_cons]
-
-/*Output the estimated mean Y value when smoke intensity increases by 20 from */
-/* baseline to 1982*/
-lincom _b[_cons] + 20*_b[smkintensity82_71 ] + ///
- 400*_b[c.smkintensity82_71#c.smkintensity82_71]
use ./data/nhefs-formatted, clear
+
+* drop sw_a
+
+/*Analysis restricted to subjects reporting <=25 cig/day at baseline: N = 1162*/
+keep if smokeintensity <=25
+
+/*Fit a linear model for the denominator of the IP weights and calculate the */
+/* mean expected smoking intensity*/
+regress smkintensity82_71 sex race c.age##c.age ib(last).education ///
+c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ib(last).exercise ib(last).active c.wt71##c.wt71
+quietly predict p_den
+
+/*Generate the denisty of the denomiator expectation using the mean expected */
+/* smoking intensity and the residuals, assuming a normal distribution*/
+/*Note: The regress command in Stata saves the root mean squared error for the */
+/* immediate regression as e(rmse), thus there is no need to calculate it again. */
+gen dens_den = normalden(smkintensity82_71, p_den, e(rmse))
+
+/*Fit a linear model for the numerator of ip weights, calculate the mean */
+/* expected value, and generate the density*/
+quietly regress smkintensity82_71
+quietly predict p_num
+gen dens_num = normalden( smkintensity82_71, p_num, e(rmse))
+
+/*Generate the final stabilized weights from the estimated numerator and */
+/* denominator, and check the weights distribution*/
+gen sw_a=dens_num/dens_den
+summarize sw_a
+
+/*Fit a marginal structural model in the pseudopopulation*/
+regress wt82_71 c.smkintensity82_71##c.smkintensity82_71 [pweight=sw_a], cluster(seqn)
+
+/*Output the estimated mean Y value when smoke intensity is unchanged from */
+/* baseline to 1982 */
+lincom _b[_cons]
+
+/*Output the estimated mean Y value when smoke intensity increases by 20 from */
+/* baseline to 1982*/
+lincom _b[_cons] + 20*_b[smkintensity82_71 ] + ///
+ 400*_b[c.smkintensity82_71#c.smkintensity82_71]
(404 observations deleted)
Source | SS df MS Number of obs = 1,162
@@ -917,33 +917,33 @@
Program 12.5
+use ./data/nhefs, clear
-
-/*Provisionally ignore subjects with missing values for follow-up weight*/
-/*Sample size after exclusion: N = 1566*/
-drop if wt82==.
-
-/*Estimate the stabilized weights for quitting smoking as in PROGRAM 12.3*/
-/*Fit a logistic model for the denominator of the IP weights and predict the */
-/* conditional probability of smoking*/
-logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
-c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
-predict pd_qsmk, pr
-/*Fit a logistic model for the numerator of ip weights and predict Pr(A=1) */
-logit qsmk
-predict pn_qsmk, pr
-/*Generate stabilized weights as f(A)/f(A|L)*/
-gen sw_a=.
-replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
-replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
-summarize sw_a
-
-/*Fit marginal structural model in the pseudopopulation*/
-/*NOTE: Stata has two commands for logistic regression, logit and logistic*/
-/*Using logistic allows us to output the odds ratios directly*/
-/*We can also output odds ratios from the logit command using the or option */
-/* (default logit output is regression coefficients*/
-logistic death qsmk [pweight=sw_a], cluster(seqn)
use ./data/nhefs, clear
+
+/*Provisionally ignore subjects with missing values for follow-up weight*/
+/*Sample size after exclusion: N = 1566*/
+drop if wt82==.
+
+/*Estimate the stabilized weights for quitting smoking as in PROGRAM 12.3*/
+/*Fit a logistic model for the denominator of the IP weights and predict the */
+/* conditional probability of smoking*/
+logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
+c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
+predict pd_qsmk, pr
+/*Fit a logistic model for the numerator of ip weights and predict Pr(A=1) */
+logit qsmk
+predict pn_qsmk, pr
+/*Generate stabilized weights as f(A)/f(A|L)*/
+gen sw_a=.
+replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
+replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
+summarize sw_a
+
+/*Fit marginal structural model in the pseudopopulation*/
+/*NOTE: Stata has two commands for logistic regression, logit and logistic*/
+/*Using logistic allows us to output the odds ratios directly*/
+/*We can also output odds ratios from the logit command using the or option */
+/* (default logit output is regression coefficients*/
+logistic death qsmk [pweight=sw_a], cluster(seqn)
(63 observations deleted)
@@ -1048,32 +1048,32 @@
Program 12.6
+use ./data/nhefs, clear
-
-* drop pd_qsmk pn_qsmk sw_a
-
-/*Check distribution of sex*/
-tab sex
-
-/*Fit logistc model for the denominator of IP weights, as in PROGRAM 12.3 */
-logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
-c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
-predict pd_qsmk, pr
-
-/*Fit logistic model for the numerator of IP weights, no including sex */
-logit qsmk sex
-predict pn_qsmk, pr
-
-/*Generate IP weights as before*/
-gen sw_a=.
-replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
-replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
-
-summarize sw_a
-
-/*Fit marginal structural model in the pseudopopulation, including interaction */
-/* term between quitting smoking and sex*/
-regress wt82_71 qsmk##sex [pw=sw_a], cluster(seqn)
use ./data/nhefs, clear
+
+* drop pd_qsmk pn_qsmk sw_a
+
+/*Check distribution of sex*/
+tab sex
+
+/*Fit logistc model for the denominator of IP weights, as in PROGRAM 12.3 */
+logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
+c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
+predict pd_qsmk, pr
+
+/*Fit logistic model for the numerator of IP weights, no including sex */
+logit qsmk sex
+predict pn_qsmk, pr
+
+/*Generate IP weights as before*/
+gen sw_a=.
+replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
+replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
+
+summarize sw_a
+
+/*Fit marginal structural model in the pseudopopulation, including interaction */
+/* term between quitting smoking and sex*/
+regress wt82_71 qsmk##sex [pw=sw_a], cluster(seqn)
sex | Freq. Percent Cum.
------------+-----------------------------------
0 | 799 49.05 49.05
@@ -1192,55 +1192,55 @@
Program 12.7
+use ./data/nhefs, clear
-
-/*Analysis including all individuals regardless of missing wt82 status: N=1629*/
-/*Generate censoring indicator: C = 1 if wt82 missing*/
-gen byte cens = (wt82 == .)
-
-/*Check distribution of censoring by quitting smoking and baseline weight*/
-tab cens qsmk, column
-bys cens: summarize wt71
-
-/*Fit logistic regression model for the denominator of IP weight for A*/
-logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
-c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
-predict pd_qsmk, pr
-
-/*Fit logistic regression model for the numerator of IP weights for A*/
-logit qsmk
-predict pn_qsmk, pr
-
-/*Fit logistic regression model for the denominator of IP weights for C, */
-/* including quitting smoking*/
-logit cens qsmk sex race c.age##c.age ib(last).education ///
-c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ib(last).exercise ///
-ib(last).active c.wt71##c.wt71
-predict pd_cens, pr
-
-/*Fit logistic regression model for the numerator of IP weights for C, */
-/* including quitting smoking */
-logit cens qsmk
-predict pn_cens, pr
-
-/*Generate the stabilized weights for A (sw_a)*/
-gen sw_a=.
-replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
-replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
-
-/*Generate the stabilized weights for C (sw_c)*/
-/*NOTE: the conditional probability estimates generated by our logistic models */
-/* for C represent the conditional probability of being censored (C=1)*/
-/*We want weights for the conditional probability of bing uncensored, Pr(C=0|A,L)*/
-gen sw_c=.
-replace sw_c=(1-pn_cens)/(1-pd_cens) if cens==0
-
-/*Generate the final stabilized weights and check distribution*/
-gen sw=sw_a*sw_c
-summarize sw
-
-/*Fit marginal structural model in the pseudopopulation*/
-regress wt82_71 qsmk [pw=sw], cluster(seqn)
use ./data/nhefs, clear
+
+/*Analysis including all individuals regardless of missing wt82 status: N=1629*/
+/*Generate censoring indicator: C = 1 if wt82 missing*/
+gen byte cens = (wt82 == .)
+
+/*Check distribution of censoring by quitting smoking and baseline weight*/
+tab cens qsmk, column
+bys cens: summarize wt71
+
+/*Fit logistic regression model for the denominator of IP weight for A*/
+logit qsmk sex race c.age##c.age ib(last).education c.smokeintensity##c.smokeintensity ///
+c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active c.wt71##c.wt71
+predict pd_qsmk, pr
+
+/*Fit logistic regression model for the numerator of IP weights for A*/
+logit qsmk
+predict pn_qsmk, pr
+
+/*Fit logistic regression model for the denominator of IP weights for C, */
+/* including quitting smoking*/
+logit cens qsmk sex race c.age##c.age ib(last).education ///
+c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ib(last).exercise ///
+ib(last).active c.wt71##c.wt71
+predict pd_cens, pr
+
+/*Fit logistic regression model for the numerator of IP weights for C, */
+/* including quitting smoking */
+logit cens qsmk
+predict pn_cens, pr
+
+/*Generate the stabilized weights for A (sw_a)*/
+gen sw_a=.
+replace sw_a=pn_qsmk/pd_qsmk if qsmk==1
+replace sw_a=(1-pn_qsmk)/(1-pd_qsmk) if qsmk==0
+
+/*Generate the stabilized weights for C (sw_c)*/
+/*NOTE: the conditional probability estimates generated by our logistic models */
+/* for C represent the conditional probability of being censored (C=1)*/
+/*We want weights for the conditional probability of bing uncensored, Pr(C=0|A,L)*/
+gen sw_c=.
+replace sw_c=(1-pn_cens)/(1-pd_cens) if cens==0
+
+/*Generate the final stabilized weights and check distribution*/
+gen sw=sw_a*sw_c
+summarize sw
+
+/*Fit marginal structural model in the pseudopopulation*/
+regress wt82_71 qsmk [pw=sw], cluster(seqn)
| Key |
|-------------------|
| frequency |
diff --git a/docs/ip-weighting-and-marginal-structural-models.html b/docs/ip-weighting-and-marginal-structural-models.html
index eda0d94..6f7627f 100644
--- a/docs/ip-weighting-and-marginal-structural-models.html
+++ b/docs/ip-weighting-and-marginal-structural-models.html
@@ -26,7 +26,7 @@
-
+
@@ -315,115 +315,115 @@
Program 12.1
-library(here)
# install.packages("readxl") # install package if required
-library("readxl")
-
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
-
-# provisionally ignore subjects with missing values for weight in 1982
-nhefs.nmv <-
- nhefs[which(!is.na(nhefs$wt82)),]
-
-lm(wt82_71 ~ qsmk, data = nhefs.nmv)
-#>
-#> Call:
-#> lm(formula = wt82_71 ~ qsmk, data = nhefs.nmv)
-#>
-#> Coefficients:
-#> (Intercept) qsmk
-#> 1.984 2.541
-# Smoking cessation
-predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 1))
-#> 1
-#> 4.525079
-# No smoking cessation
-predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 0))
-#> 1
-#> 1.984498
-
-# Table
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$age)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 25.00 33.00 42.00 42.79 51.00 72.00
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$wt71)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 40.82 59.19 68.49 70.30 79.38 151.73
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeintensity)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.00 15.00 20.00 21.19 30.00 60.00
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeyrs)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.00 15.00 23.00 24.09 32.00 64.00
-
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$age)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 25.00 35.00 46.00 46.17 56.00 74.00
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$wt71)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 39.58 60.67 71.21 72.35 81.08 136.98
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeintensity)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.0 10.0 20.0 18.6 25.0 80.0
-summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeyrs)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.00 15.00 26.00 26.03 35.00 60.00
-
-table(nhefs.nmv$qsmk, nhefs.nmv$sex)
-#>
-#> 0 1
-#> 0 542 621
-#> 1 220 183
-prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$sex), 1)
-#>
-#> 0 1
-#> 0 0.4660361 0.5339639
-#> 1 0.5459057 0.4540943
-
-table(nhefs.nmv$qsmk, nhefs.nmv$race)
-#>
-#> 0 1
-#> 0 993 170
-#> 1 367 36
-prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$race), 1)
-#>
-#> 0 1
-#> 0 0.85382631 0.14617369
-#> 1 0.91066998 0.08933002
-
-table(nhefs.nmv$qsmk, nhefs.nmv$education)
-#>
-#> 1 2 3 4 5
-#> 0 210 266 480 92 115
-#> 1 81 74 157 29 62
-prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$education), 1)
-#>
-#> 1 2 3 4 5
-#> 0 0.18056750 0.22871883 0.41272571 0.07910576 0.09888220
-#> 1 0.20099256 0.18362283 0.38957816 0.07196030 0.15384615
-
-table(nhefs.nmv$qsmk, nhefs.nmv$exercise)
-#>
-#> 0 1 2
-#> 0 237 485 441
-#> 1 63 176 164
-prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$exercise), 1)
-#>
-#> 0 1 2
-#> 0 0.2037833 0.4170249 0.3791917
-#> 1 0.1563275 0.4367246 0.4069479
-
-table(nhefs.nmv$qsmk, nhefs.nmv$active)
-#>
-#> 0 1 2
-#> 0 532 527 104
-#> 1 170 188 45
-prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$active), 1)
-#>
-#> 0 1 2
-#> 0 0.4574377 0.4531384 0.0894239
-#> 1 0.4218362 0.4665012 0.1116625
# install.packages("readxl") # install package if required
+library("readxl")
+
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
+
+# provisionally ignore subjects with missing values for weight in 1982
+nhefs.nmv <-
+ nhefs[which(!is.na(nhefs$wt82)),]
+
+lm(wt82_71 ~ qsmk, data = nhefs.nmv)
+#>
+#> Call:
+#> lm(formula = wt82_71 ~ qsmk, data = nhefs.nmv)
+#>
+#> Coefficients:
+#> (Intercept) qsmk
+#> 1.984 2.541
# Smoking cessation
+predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 1))
+#> 1
+#> 4.525079
# No smoking cessation
+predict(lm(wt82_71 ~ qsmk, data = nhefs.nmv), data.frame(qsmk = 0))
+#> 1
+#> 1.984498
+# Table
+summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$age)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 25.00 33.00 42.00 42.79 51.00 72.00
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$wt71)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 40.82 59.19 68.49 70.30 79.38 151.73
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeintensity)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.00 15.00 20.00 21.19 30.00 60.00
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 0),]$smokeyrs)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.00 15.00 23.00 24.09 32.00 64.00
+summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$age)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 25.00 35.00 46.00 46.17 56.00 74.00
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$wt71)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 39.58 60.67 71.21 72.35 81.08 136.98
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeintensity)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.0 10.0 20.0 18.6 25.0 80.0
summary(nhefs.nmv[which(nhefs.nmv$qsmk == 1),]$smokeyrs)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.00 15.00 26.00 26.03 35.00 60.00
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$sex), 1)
+#>
+#> 0 1
+#> 0 0.4660361 0.5339639
+#> 1 0.5459057 0.4540943
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$race), 1)
+#>
+#> 0 1
+#> 0 0.85382631 0.14617369
+#> 1 0.91066998 0.08933002
+table(nhefs.nmv$qsmk, nhefs.nmv$education)
+#>
+#> 1 2 3 4 5
+#> 0 210 266 480 92 115
+#> 1 81 74 157 29 62
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$education), 1)
+#>
+#> 1 2 3 4 5
+#> 0 0.18056750 0.22871883 0.41272571 0.07910576 0.09888220
+#> 1 0.20099256 0.18362283 0.38957816 0.07196030 0.15384615
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$exercise), 1)
+#>
+#> 0 1 2
+#> 0 0.2037833 0.4170249 0.3791917
+#> 1 0.1563275 0.4367246 0.4069479
prop.table(table(nhefs.nmv$qsmk, nhefs.nmv$active), 1)
+#>
+#> 0 1 2
+#> 0 0.4574377 0.4531384 0.0894239
+#> 1 0.4218362 0.4665012 0.1116625
Program 12.2
@@ -431,165 +431,165 @@ Program 12.2
# Estimation of ip weights via a logistic model
-fit <- glm(
- qsmk ~ sex + race + age + I(age ^ 2) +
- as.factor(education) + smokeintensity +
- I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
- family = binomial(),
- data = nhefs.nmv
-)
-summary(fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ sex + race + age + I(age^2) + as.factor(education) +
-#> smokeintensity + I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) +
-#> as.factor(exercise) + as.factor(active) + wt71 + I(wt71^2),
-#> family = binomial(), data = nhefs.nmv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -2.2425191 1.3808360 -1.624 0.104369
-#> sex -0.5274782 0.1540496 -3.424 0.000617 ***
-#> race -0.8392636 0.2100665 -3.995 6.46e-05 ***
-#> age 0.1212052 0.0512663 2.364 0.018068 *
-#> I(age^2) -0.0008246 0.0005361 -1.538 0.124039
-#> as.factor(education)2 -0.0287755 0.1983506 -0.145 0.884653
-#> as.factor(education)3 0.0864318 0.1780850 0.485 0.627435
-#> as.factor(education)4 0.0636010 0.2732108 0.233 0.815924
-#> as.factor(education)5 0.4759606 0.2262237 2.104 0.035384 *
-#> smokeintensity -0.0772704 0.0152499 -5.067 4.04e-07 ***
-#> I(smokeintensity^2) 0.0010451 0.0002866 3.647 0.000265 ***
-#> smokeyrs -0.0735966 0.0277775 -2.650 0.008061 **
-#> I(smokeyrs^2) 0.0008441 0.0004632 1.822 0.068398 .
-#> as.factor(exercise)1 0.3548405 0.1801351 1.970 0.048855 *
-#> as.factor(exercise)2 0.3957040 0.1872400 2.113 0.034571 *
-#> as.factor(active)1 0.0319445 0.1329372 0.240 0.810100
-#> as.factor(active)2 0.1767840 0.2149720 0.822 0.410873
-#> wt71 -0.0152357 0.0263161 -0.579 0.562625
-#> I(wt71^2) 0.0001352 0.0001632 0.829 0.407370
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1786.1 on 1565 degrees of freedom
-#> Residual deviance: 1676.9 on 1547 degrees of freedom
-#> AIC: 1714.9
-#>
-#> Number of Fisher Scoring iterations: 4
-
-p.qsmk.obs <-
- ifelse(nhefs.nmv$qsmk == 0,
- 1 - predict(fit, type = "response"),
- predict(fit, type = "response"))
-
-nhefs.nmv$w <- 1 / p.qsmk.obs
-summary(nhefs.nmv$w)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 1.054 1.230 1.373 1.996 1.990 16.700
-sd(nhefs.nmv$w)
-#> [1] 1.474787
-
-# install.packages("geepack") # install package if required
-library("geepack")
-msm.w <- geeglm(
- wt82_71 ~ qsmk,
- data = nhefs.nmv,
- weights = w,
- id = seqn,
- corstr = "independence"
-)
-summary(msm.w)
-#>
-#> Call:
-#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs.nmv, weights = w,
-#> id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 1.7800 0.2247 62.73 2.33e-15 ***
-#> qsmk 3.4405 0.5255 42.87 5.86e-11 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 65.06 4.221
-#> Number of clusters: 1566 Maximum cluster size: 1
-
-beta <- coef(msm.w)
-SE <- coef(summary(msm.w))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 1.780 1.340 2.22
-#> qsmk 3.441 2.411 4.47
-
-# no association between sex and qsmk in pseudo-population
-xtabs(nhefs.nmv$w ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
-#> nhefs.nmv$qsmk
-#> nhefs.nmv$sex 0 1
-#> 0 763.6 763.6
-#> 1 801.7 797.2
-
-# "check" for positivity (White women)
-table(nhefs.nmv$age[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1],
- nhefs.nmv$qsmk[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1])
-#>
-#> 0 1
-#> 25 24 3
-#> 26 14 5
-#> 27 18 2
-#> 28 20 5
-#> 29 15 4
-#> 30 14 5
-#> 31 11 5
-#> 32 14 7
-#> 33 12 3
-#> 34 22 5
-#> 35 16 5
-#> 36 13 3
-#> 37 14 1
-#> 38 6 2
-#> 39 19 4
-#> 40 10 4
-#> 41 13 3
-#> 42 16 3
-#> 43 14 3
-#> 44 9 4
-#> 45 12 5
-#> 46 19 4
-#> 47 19 4
-#> 48 19 4
-#> 49 11 3
-#> 50 18 4
-#> 51 9 3
-#> 52 11 3
-#> 53 11 4
-#> 54 17 9
-#> 55 9 4
-#> 56 8 7
-#> 57 9 2
-#> 58 8 4
-#> 59 5 4
-#> 60 5 4
-#> 61 5 2
-#> 62 6 5
-#> 63 3 3
-#> 64 7 1
-#> 65 3 2
-#> 66 4 0
-#> 67 2 0
-#> 69 6 2
-#> 70 2 1
-#> 71 0 1
-#> 72 2 2
-#> 74 0 1
# Estimation of ip weights via a logistic model
+fit <- glm(
+ qsmk ~ sex + race + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
+ family = binomial(),
+ data = nhefs.nmv
+)
+summary(fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ sex + race + age + I(age^2) + as.factor(education) +
+#> smokeintensity + I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) +
+#> as.factor(exercise) + as.factor(active) + wt71 + I(wt71^2),
+#> family = binomial(), data = nhefs.nmv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -2.2425191 1.3808360 -1.624 0.104369
+#> sex -0.5274782 0.1540496 -3.424 0.000617 ***
+#> race -0.8392636 0.2100665 -3.995 6.46e-05 ***
+#> age 0.1212052 0.0512663 2.364 0.018068 *
+#> I(age^2) -0.0008246 0.0005361 -1.538 0.124039
+#> as.factor(education)2 -0.0287755 0.1983506 -0.145 0.884653
+#> as.factor(education)3 0.0864318 0.1780850 0.485 0.627435
+#> as.factor(education)4 0.0636010 0.2732108 0.233 0.815924
+#> as.factor(education)5 0.4759606 0.2262237 2.104 0.035384 *
+#> smokeintensity -0.0772704 0.0152499 -5.067 4.04e-07 ***
+#> I(smokeintensity^2) 0.0010451 0.0002866 3.647 0.000265 ***
+#> smokeyrs -0.0735966 0.0277775 -2.650 0.008061 **
+#> I(smokeyrs^2) 0.0008441 0.0004632 1.822 0.068398 .
+#> as.factor(exercise)1 0.3548405 0.1801351 1.970 0.048855 *
+#> as.factor(exercise)2 0.3957040 0.1872400 2.113 0.034571 *
+#> as.factor(active)1 0.0319445 0.1329372 0.240 0.810100
+#> as.factor(active)2 0.1767840 0.2149720 0.822 0.410873
+#> wt71 -0.0152357 0.0263161 -0.579 0.562625
+#> I(wt71^2) 0.0001352 0.0001632 0.829 0.407370
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1786.1 on 1565 degrees of freedom
+#> Residual deviance: 1676.9 on 1547 degrees of freedom
+#> AIC: 1714.9
+#>
+#> Number of Fisher Scoring iterations: 4
+p.qsmk.obs <-
+ ifelse(nhefs.nmv$qsmk == 0,
+ 1 - predict(fit, type = "response"),
+ predict(fit, type = "response"))
+
+nhefs.nmv$w <- 1 / p.qsmk.obs
+summary(nhefs.nmv$w)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 1.054 1.230 1.373 1.996 1.990 16.700
+# install.packages("geepack") # install package if required
+library("geepack")
+msm.w <- geeglm(
+ wt82_71 ~ qsmk,
+ data = nhefs.nmv,
+ weights = w,
+ id = seqn,
+ corstr = "independence"
+)
+summary(msm.w)
+#>
+#> Call:
+#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs.nmv, weights = w,
+#> id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 1.7800 0.2247 62.73 2.33e-15 ***
+#> qsmk 3.4405 0.5255 42.87 5.86e-11 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 65.06 4.221
+#> Number of clusters: 1566 Maximum cluster size: 1
+beta <- coef(msm.w)
+SE <- coef(summary(msm.w))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) 1.780 1.340 2.22
+#> qsmk 3.441 2.411 4.47
+# no association between sex and qsmk in pseudo-population
+xtabs(nhefs.nmv$w ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
+#> nhefs.nmv$qsmk
+#> nhefs.nmv$sex 0 1
+#> 0 763.6 763.6
+#> 1 801.7 797.2
+# "check" for positivity (White women)
+table(nhefs.nmv$age[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1],
+ nhefs.nmv$qsmk[nhefs.nmv$race == 0 & nhefs.nmv$sex == 1])
+#>
+#> 0 1
+#> 25 24 3
+#> 26 14 5
+#> 27 18 2
+#> 28 20 5
+#> 29 15 4
+#> 30 14 5
+#> 31 11 5
+#> 32 14 7
+#> 33 12 3
+#> 34 22 5
+#> 35 16 5
+#> 36 13 3
+#> 37 14 1
+#> 38 6 2
+#> 39 19 4
+#> 40 10 4
+#> 41 13 3
+#> 42 16 3
+#> 43 14 3
+#> 44 9 4
+#> 45 12 5
+#> 46 19 4
+#> 47 19 4
+#> 48 19 4
+#> 49 11 3
+#> 50 18 4
+#> 51 9 3
+#> 52 11 3
+#> 53 11 4
+#> 54 17 9
+#> 55 9 4
+#> 56 8 7
+#> 57 9 2
+#> 58 8 4
+#> 59 5 4
+#> 60 5 4
+#> 61 5 2
+#> 62 6 5
+#> 63 3 3
+#> 64 7 1
+#> 65 3 2
+#> 66 4 0
+#> 67 2 0
+#> 69 6 2
+#> 70 2 1
+#> 71 0 1
+#> 72 2 2
+#> 74 0 1
Program 12.3
@@ -597,208 +597,208 @@ Program 12.3
# estimation of denominator of ip weights
-denom.fit <-
- glm(
- qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
- as.factor(education) + smokeintensity +
- I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
- family = binomial(),
- data = nhefs.nmv
- )
-summary(denom.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
-#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
-#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71^2), family = binomial(), data = nhefs.nmv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -2.242519 1.380836 -1.62 0.10437
-#> as.factor(sex)1 -0.527478 0.154050 -3.42 0.00062 ***
-#> as.factor(race)1 -0.839264 0.210067 -4.00 6.5e-05 ***
-#> age 0.121205 0.051266 2.36 0.01807 *
-#> I(age^2) -0.000825 0.000536 -1.54 0.12404
-#> as.factor(education)2 -0.028776 0.198351 -0.15 0.88465
-#> as.factor(education)3 0.086432 0.178085 0.49 0.62744
-#> as.factor(education)4 0.063601 0.273211 0.23 0.81592
-#> as.factor(education)5 0.475961 0.226224 2.10 0.03538 *
-#> smokeintensity -0.077270 0.015250 -5.07 4.0e-07 ***
-#> I(smokeintensity^2) 0.001045 0.000287 3.65 0.00027 ***
-#> smokeyrs -0.073597 0.027777 -2.65 0.00806 **
-#> I(smokeyrs^2) 0.000844 0.000463 1.82 0.06840 .
-#> as.factor(exercise)1 0.354841 0.180135 1.97 0.04885 *
-#> as.factor(exercise)2 0.395704 0.187240 2.11 0.03457 *
-#> as.factor(active)1 0.031944 0.132937 0.24 0.81010
-#> as.factor(active)2 0.176784 0.214972 0.82 0.41087
-#> wt71 -0.015236 0.026316 -0.58 0.56262
-#> I(wt71^2) 0.000135 0.000163 0.83 0.40737
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1786.1 on 1565 degrees of freedom
-#> Residual deviance: 1676.9 on 1547 degrees of freedom
-#> AIC: 1715
-#>
-#> Number of Fisher Scoring iterations: 4
-
-pd.qsmk <- predict(denom.fit, type = "response")
-
-# estimation of numerator of ip weights
-numer.fit <- glm(qsmk ~ 1, family = binomial(), data = nhefs.nmv)
-summary(numer.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ 1, family = binomial(), data = nhefs.nmv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -1.0598 0.0578 -18.3 <2e-16 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1786.1 on 1565 degrees of freedom
-#> Residual deviance: 1786.1 on 1565 degrees of freedom
-#> AIC: 1788
-#>
-#> Number of Fisher Scoring iterations: 4
-
-pn.qsmk <- predict(numer.fit, type = "response")
-
-nhefs.nmv$sw <-
- ifelse(nhefs.nmv$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
- (pn.qsmk / pd.qsmk))
-
-summary(nhefs.nmv$sw)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.331 0.867 0.950 0.999 1.079 4.298
-
-
-msm.sw <- geeglm(
- wt82_71 ~ qsmk,
- data = nhefs.nmv,
- weights = sw,
- id = seqn,
- corstr = "independence"
-)
-summary(msm.sw)
-#>
-#> Call:
-#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs.nmv, weights = sw,
-#> id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 1.780 0.225 62.7 2.3e-15 ***
-#> qsmk 3.441 0.525 42.9 5.9e-11 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 60.7 3.71
-#> Number of clusters: 1566 Maximum cluster size: 1
-
-beta <- coef(msm.sw)
-SE <- coef(summary(msm.sw))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 1.78 1.34 2.22
-#> qsmk 3.44 2.41 4.47
-
-# no association between sex and qsmk in pseudo-population
-xtabs(nhefs.nmv$sw ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
-#> nhefs.nmv$qsmk
-#> nhefs.nmv$sex 0 1
-#> 0 567 197
-#> 1 595 205
# estimation of denominator of ip weights
+denom.fit <-
+ glm(
+ qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
+ family = binomial(),
+ data = nhefs.nmv
+ )
+summary(denom.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
+#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
+#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71^2), family = binomial(), data = nhefs.nmv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -2.242519 1.380836 -1.62 0.10437
+#> as.factor(sex)1 -0.527478 0.154050 -3.42 0.00062 ***
+#> as.factor(race)1 -0.839264 0.210067 -4.00 6.5e-05 ***
+#> age 0.121205 0.051266 2.36 0.01807 *
+#> I(age^2) -0.000825 0.000536 -1.54 0.12404
+#> as.factor(education)2 -0.028776 0.198351 -0.15 0.88465
+#> as.factor(education)3 0.086432 0.178085 0.49 0.62744
+#> as.factor(education)4 0.063601 0.273211 0.23 0.81592
+#> as.factor(education)5 0.475961 0.226224 2.10 0.03538 *
+#> smokeintensity -0.077270 0.015250 -5.07 4.0e-07 ***
+#> I(smokeintensity^2) 0.001045 0.000287 3.65 0.00027 ***
+#> smokeyrs -0.073597 0.027777 -2.65 0.00806 **
+#> I(smokeyrs^2) 0.000844 0.000463 1.82 0.06840 .
+#> as.factor(exercise)1 0.354841 0.180135 1.97 0.04885 *
+#> as.factor(exercise)2 0.395704 0.187240 2.11 0.03457 *
+#> as.factor(active)1 0.031944 0.132937 0.24 0.81010
+#> as.factor(active)2 0.176784 0.214972 0.82 0.41087
+#> wt71 -0.015236 0.026316 -0.58 0.56262
+#> I(wt71^2) 0.000135 0.000163 0.83 0.40737
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1786.1 on 1565 degrees of freedom
+#> Residual deviance: 1676.9 on 1547 degrees of freedom
+#> AIC: 1715
+#>
+#> Number of Fisher Scoring iterations: 4
+pd.qsmk <- predict(denom.fit, type = "response")
+
+# estimation of numerator of ip weights
+numer.fit <- glm(qsmk ~ 1, family = binomial(), data = nhefs.nmv)
+summary(numer.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ 1, family = binomial(), data = nhefs.nmv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -1.0598 0.0578 -18.3 <2e-16 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1786.1 on 1565 degrees of freedom
+#> Residual deviance: 1786.1 on 1565 degrees of freedom
+#> AIC: 1788
+#>
+#> Number of Fisher Scoring iterations: 4
+pn.qsmk <- predict(numer.fit, type = "response")
+
+nhefs.nmv$sw <-
+ ifelse(nhefs.nmv$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
+ (pn.qsmk / pd.qsmk))
+
+summary(nhefs.nmv$sw)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.331 0.867 0.950 0.999 1.079 4.298
+
+msm.sw <- geeglm(
+ wt82_71 ~ qsmk,
+ data = nhefs.nmv,
+ weights = sw,
+ id = seqn,
+ corstr = "independence"
+)
+summary(msm.sw)
+#>
+#> Call:
+#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs.nmv, weights = sw,
+#> id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 1.780 0.225 62.7 2.3e-15 ***
+#> qsmk 3.441 0.525 42.9 5.9e-11 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 60.7 3.71
+#> Number of clusters: 1566 Maximum cluster size: 1
+beta <- coef(msm.sw)
+SE <- coef(summary(msm.sw))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) 1.78 1.34 2.22
+#> qsmk 3.44 2.41 4.47
+# no association between sex and qsmk in pseudo-population
+xtabs(nhefs.nmv$sw ~ nhefs.nmv$sex + nhefs.nmv$qsmk)
+#> nhefs.nmv$qsmk
+#> nhefs.nmv$sex 0 1
+#> 0 567 197
+#> 1 595 205
Program 12.4
-# Analysis restricted to subjects reporting <=25 cig/day at baseline
-nhefs.nmv.s <- subset(nhefs.nmv, smokeintensity <= 25)
-
-# estimation of denominator of ip weights
-den.fit.obj <- lm(
- smkintensity82_71 ~ as.factor(sex) +
- as.factor(race) + age + I(age ^ 2) +
- as.factor(education) + smokeintensity + I(smokeintensity ^ 2) +
- smokeyrs + I(smokeyrs ^ 2) + as.factor(exercise) + as.factor(active) + wt71 +
- I(wt71 ^ 2),
- data = nhefs.nmv.s
-)
-p.den <- predict(den.fit.obj, type = "response")
-dens.den <-
- dnorm(nhefs.nmv.s$smkintensity82_71,
- p.den,
- summary(den.fit.obj)$sigma)
-
-# estimation of numerator of ip weights
-num.fit.obj <- lm(smkintensity82_71 ~ 1, data = nhefs.nmv.s)
-p.num <- predict(num.fit.obj, type = "response")
-dens.num <-
- dnorm(nhefs.nmv.s$smkintensity82_71,
- p.num,
- summary(num.fit.obj)$sigma)
-
-nhefs.nmv.s$sw.a <- dens.num / dens.den
-summary(nhefs.nmv.s$sw.a)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.19 0.89 0.97 1.00 1.05 5.10
-
-msm.sw.cont <-
- geeglm(
- wt82_71 ~ smkintensity82_71 + I(smkintensity82_71 * smkintensity82_71),
- data = nhefs.nmv.s,
- weights = sw.a,
- id = seqn,
- corstr = "independence"
- )
-summary(msm.sw.cont)
-#>
-#> Call:
-#> geeglm(formula = wt82_71 ~ smkintensity82_71 + I(smkintensity82_71 *
-#> smkintensity82_71), data = nhefs.nmv.s, weights = sw.a, id = seqn,
-#> corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 2.00452 0.29512 46.13 1.1e-11 ***
-#> smkintensity82_71 -0.10899 0.03154 11.94 0.00055 ***
-#> I(smkintensity82_71 * smkintensity82_71) 0.00269 0.00242 1.24 0.26489
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 60.5 4.5
-#> Number of clusters: 1162 Maximum cluster size: 1
-
-beta <- coef(msm.sw.cont)
-SE <- coef(summary(msm.sw.cont))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 2.00452 1.42610 2.58295
-#> smkintensity82_71 -0.10899 -0.17080 -0.04718
-#> I(smkintensity82_71 * smkintensity82_71) 0.00269 -0.00204 0.00743
# Analysis restricted to subjects reporting <=25 cig/day at baseline
+nhefs.nmv.s <- subset(nhefs.nmv, smokeintensity <= 25)
+
+# estimation of denominator of ip weights
+den.fit.obj <- lm(
+ smkintensity82_71 ~ as.factor(sex) +
+ as.factor(race) + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity + I(smokeintensity ^ 2) +
+ smokeyrs + I(smokeyrs ^ 2) + as.factor(exercise) + as.factor(active) + wt71 +
+ I(wt71 ^ 2),
+ data = nhefs.nmv.s
+)
+p.den <- predict(den.fit.obj, type = "response")
+dens.den <-
+ dnorm(nhefs.nmv.s$smkintensity82_71,
+ p.den,
+ summary(den.fit.obj)$sigma)
+
+# estimation of numerator of ip weights
+num.fit.obj <- lm(smkintensity82_71 ~ 1, data = nhefs.nmv.s)
+p.num <- predict(num.fit.obj, type = "response")
+dens.num <-
+ dnorm(nhefs.nmv.s$smkintensity82_71,
+ p.num,
+ summary(num.fit.obj)$sigma)
+
+nhefs.nmv.s$sw.a <- dens.num / dens.den
+summary(nhefs.nmv.s$sw.a)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.19 0.89 0.97 1.00 1.05 5.10
+msm.sw.cont <-
+ geeglm(
+ wt82_71 ~ smkintensity82_71 + I(smkintensity82_71 * smkintensity82_71),
+ data = nhefs.nmv.s,
+ weights = sw.a,
+ id = seqn,
+ corstr = "independence"
+ )
+summary(msm.sw.cont)
+#>
+#> Call:
+#> geeglm(formula = wt82_71 ~ smkintensity82_71 + I(smkintensity82_71 *
+#> smkintensity82_71), data = nhefs.nmv.s, weights = sw.a, id = seqn,
+#> corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 2.00452 0.29512 46.13 1.1e-11 ***
+#> smkintensity82_71 -0.10899 0.03154 11.94 0.00055 ***
+#> I(smkintensity82_71 * smkintensity82_71) 0.00269 0.00242 1.24 0.26489
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 60.5 4.5
+#> Number of clusters: 1162 Maximum cluster size: 1
+beta <- coef(msm.sw.cont)
+SE <- coef(summary(msm.sw.cont))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) 2.00452 1.42610 2.58295
+#> smkintensity82_71 -0.10899 -0.17080 -0.04718
+#> I(smkintensity82_71 * smkintensity82_71) 0.00269 -0.00204 0.00743
Program 12.5
@@ -806,51 +806,51 @@ Program 12.5
table(nhefs.nmv$qsmk, nhefs.nmv$death)
-#>
-#> 0 1
-#> 0 963 200
-#> 1 312 91
-
-# First, estimation of stabilized weights sw (same as in Program 12.3)
-# Second, fit logistic model below
-msm.logistic <- geeglm(
- death ~ qsmk,
- data = nhefs.nmv,
- weights = sw,
- id = seqn,
- family = binomial(),
- corstr = "independence"
-)
-#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
-summary(msm.logistic)
-#>
-#> Call:
-#> geeglm(formula = death ~ qsmk, family = binomial(), data = nhefs.nmv,
-#> weights = sw, id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) -1.4905 0.0789 356.50 <2e-16 ***
-#> qsmk 0.0301 0.1573 0.04 0.85
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 1 0.0678
-#> Number of clusters: 1566 Maximum cluster size: 1
-
-beta <- coef(msm.logistic)
-SE <- coef(summary(msm.logistic))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) -1.4905 -1.645 -1.336
-#> qsmk 0.0301 -0.278 0.338
+# First, estimation of stabilized weights sw (same as in Program 12.3)
+# Second, fit logistic model below
+msm.logistic <- geeglm(
+ death ~ qsmk,
+ data = nhefs.nmv,
+ weights = sw,
+ id = seqn,
+ family = binomial(),
+ corstr = "independence"
+)
+#> Warning in eval(family$initialize): non-integer #successes in a binomial glm!
summary(msm.logistic)
+#>
+#> Call:
+#> geeglm(formula = death ~ qsmk, family = binomial(), data = nhefs.nmv,
+#> weights = sw, id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) -1.4905 0.0789 356.50 <2e-16 ***
+#> qsmk 0.0301 0.1573 0.04 0.85
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 1 0.0678
+#> Number of clusters: 1566 Maximum cluster size: 1
+beta <- coef(msm.logistic)
+SE <- coef(summary(msm.logistic))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) -1.4905 -1.645 -1.336
+#> qsmk 0.0301 -0.278 0.338
Program 12.6
@@ -858,139 +858,139 @@ Program 12.6
table(nhefs.nmv$sex)
-#>
-#> 0 1
-#> 762 804
-
-# estimation of denominator of ip weights
-denom.fit <-
- glm(
- qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
- as.factor(education) + smokeintensity +
- I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
- family = binomial(),
- data = nhefs.nmv
- )
-summary(denom.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
-#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
-#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71^2), family = binomial(), data = nhefs.nmv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -2.242519 1.380836 -1.62 0.10437
-#> as.factor(sex)1 -0.527478 0.154050 -3.42 0.00062 ***
-#> as.factor(race)1 -0.839264 0.210067 -4.00 6.5e-05 ***
-#> age 0.121205 0.051266 2.36 0.01807 *
-#> I(age^2) -0.000825 0.000536 -1.54 0.12404
-#> as.factor(education)2 -0.028776 0.198351 -0.15 0.88465
-#> as.factor(education)3 0.086432 0.178085 0.49 0.62744
-#> as.factor(education)4 0.063601 0.273211 0.23 0.81592
-#> as.factor(education)5 0.475961 0.226224 2.10 0.03538 *
-#> smokeintensity -0.077270 0.015250 -5.07 4.0e-07 ***
-#> I(smokeintensity^2) 0.001045 0.000287 3.65 0.00027 ***
-#> smokeyrs -0.073597 0.027777 -2.65 0.00806 **
-#> I(smokeyrs^2) 0.000844 0.000463 1.82 0.06840 .
-#> as.factor(exercise)1 0.354841 0.180135 1.97 0.04885 *
-#> as.factor(exercise)2 0.395704 0.187240 2.11 0.03457 *
-#> as.factor(active)1 0.031944 0.132937 0.24 0.81010
-#> as.factor(active)2 0.176784 0.214972 0.82 0.41087
-#> wt71 -0.015236 0.026316 -0.58 0.56262
-#> I(wt71^2) 0.000135 0.000163 0.83 0.40737
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1786.1 on 1565 degrees of freedom
-#> Residual deviance: 1676.9 on 1547 degrees of freedom
-#> AIC: 1715
-#>
-#> Number of Fisher Scoring iterations: 4
-
-pd.qsmk <- predict(denom.fit, type = "response")
-
-# estimation of numerator of ip weights
-numer.fit <-
- glm(qsmk ~ as.factor(sex), family = binomial(), data = nhefs.nmv)
-summary(numer.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ as.factor(sex), family = binomial(), data = nhefs.nmv)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -0.9016 0.0799 -11.28 <2e-16 ***
-#> as.factor(sex)1 -0.3202 0.1160 -2.76 0.0058 **
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1786.1 on 1565 degrees of freedom
-#> Residual deviance: 1778.4 on 1564 degrees of freedom
-#> AIC: 1782
-#>
-#> Number of Fisher Scoring iterations: 4
-pn.qsmk <- predict(numer.fit, type = "response")
-
-nhefs.nmv$sw.a <-
- ifelse(nhefs.nmv$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
- (pn.qsmk / pd.qsmk))
-
-summary(nhefs.nmv$sw.a)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.29 0.88 0.96 1.00 1.08 3.80
-sd(nhefs.nmv$sw.a)
-#> [1] 0.271
-
-# Estimating parameters of a marginal structural mean model
-msm.emm <- geeglm(
- wt82_71 ~ as.factor(qsmk) + as.factor(sex)
- + as.factor(qsmk):as.factor(sex),
- data = nhefs.nmv,
- weights = sw.a,
- id = seqn,
- corstr = "independence"
-)
-summary(msm.emm)
-#>
-#> Call:
-#> geeglm(formula = wt82_71 ~ as.factor(qsmk) + as.factor(sex) +
-#> as.factor(qsmk):as.factor(sex), data = nhefs.nmv, weights = sw.a,
-#> id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 1.78445 0.30984 33.17 8.5e-09 ***
-#> as.factor(qsmk)1 3.52198 0.65707 28.73 8.3e-08 ***
-#> as.factor(sex)1 -0.00872 0.44882 0.00 0.98
-#> as.factor(qsmk)1:as.factor(sex)1 -0.15948 1.04608 0.02 0.88
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 60.8 3.71
-#> Number of clusters: 1566 Maximum cluster size: 1
-
-beta <- coef(msm.emm)
-SE <- coef(summary(msm.emm))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 1.78445 1.177 2.392
-#> as.factor(qsmk)1 3.52198 2.234 4.810
-#> as.factor(sex)1 -0.00872 -0.888 0.871
-#> as.factor(qsmk)1:as.factor(sex)1 -0.15948 -2.210 1.891
+# estimation of denominator of ip weights
+denom.fit <-
+ glm(
+ qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
+ family = binomial(),
+ data = nhefs.nmv
+ )
+summary(denom.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
+#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
+#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71^2), family = binomial(), data = nhefs.nmv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -2.242519 1.380836 -1.62 0.10437
+#> as.factor(sex)1 -0.527478 0.154050 -3.42 0.00062 ***
+#> as.factor(race)1 -0.839264 0.210067 -4.00 6.5e-05 ***
+#> age 0.121205 0.051266 2.36 0.01807 *
+#> I(age^2) -0.000825 0.000536 -1.54 0.12404
+#> as.factor(education)2 -0.028776 0.198351 -0.15 0.88465
+#> as.factor(education)3 0.086432 0.178085 0.49 0.62744
+#> as.factor(education)4 0.063601 0.273211 0.23 0.81592
+#> as.factor(education)5 0.475961 0.226224 2.10 0.03538 *
+#> smokeintensity -0.077270 0.015250 -5.07 4.0e-07 ***
+#> I(smokeintensity^2) 0.001045 0.000287 3.65 0.00027 ***
+#> smokeyrs -0.073597 0.027777 -2.65 0.00806 **
+#> I(smokeyrs^2) 0.000844 0.000463 1.82 0.06840 .
+#> as.factor(exercise)1 0.354841 0.180135 1.97 0.04885 *
+#> as.factor(exercise)2 0.395704 0.187240 2.11 0.03457 *
+#> as.factor(active)1 0.031944 0.132937 0.24 0.81010
+#> as.factor(active)2 0.176784 0.214972 0.82 0.41087
+#> wt71 -0.015236 0.026316 -0.58 0.56262
+#> I(wt71^2) 0.000135 0.000163 0.83 0.40737
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1786.1 on 1565 degrees of freedom
+#> Residual deviance: 1676.9 on 1547 degrees of freedom
+#> AIC: 1715
+#>
+#> Number of Fisher Scoring iterations: 4
+pd.qsmk <- predict(denom.fit, type = "response")
+
+# estimation of numerator of ip weights
+numer.fit <-
+ glm(qsmk ~ as.factor(sex), family = binomial(), data = nhefs.nmv)
+summary(numer.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ as.factor(sex), family = binomial(), data = nhefs.nmv)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -0.9016 0.0799 -11.28 <2e-16 ***
+#> as.factor(sex)1 -0.3202 0.1160 -2.76 0.0058 **
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1786.1 on 1565 degrees of freedom
+#> Residual deviance: 1778.4 on 1564 degrees of freedom
+#> AIC: 1782
+#>
+#> Number of Fisher Scoring iterations: 4
pn.qsmk <- predict(numer.fit, type = "response")
+
+nhefs.nmv$sw.a <-
+ ifelse(nhefs.nmv$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
+ (pn.qsmk / pd.qsmk))
+
+summary(nhefs.nmv$sw.a)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.29 0.88 0.96 1.00 1.08 3.80
+# Estimating parameters of a marginal structural mean model
+msm.emm <- geeglm(
+ wt82_71 ~ as.factor(qsmk) + as.factor(sex)
+ + as.factor(qsmk):as.factor(sex),
+ data = nhefs.nmv,
+ weights = sw.a,
+ id = seqn,
+ corstr = "independence"
+)
+summary(msm.emm)
+#>
+#> Call:
+#> geeglm(formula = wt82_71 ~ as.factor(qsmk) + as.factor(sex) +
+#> as.factor(qsmk):as.factor(sex), data = nhefs.nmv, weights = sw.a,
+#> id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 1.78445 0.30984 33.17 8.5e-09 ***
+#> as.factor(qsmk)1 3.52198 0.65707 28.73 8.3e-08 ***
+#> as.factor(sex)1 -0.00872 0.44882 0.00 0.98
+#> as.factor(qsmk)1:as.factor(sex)1 -0.15948 1.04608 0.02 0.88
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 60.8 3.71
+#> Number of clusters: 1566 Maximum cluster size: 1
+beta <- coef(msm.emm)
+SE <- coef(summary(msm.emm))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) 1.78445 1.177 2.392
+#> as.factor(qsmk)1 3.52198 2.234 4.810
+#> as.factor(sex)1 -0.00872 -0.888 0.871
+#> as.factor(qsmk)1:as.factor(sex)1 -0.15948 -2.210 1.891
Program 12.7
@@ -998,228 +998,228 @@ Program 12.7
table(nhefs$qsmk, nhefs$cens)
-#>
-#> 0 1
-#> 0 1163 38
-#> 1 403 25
-
-summary(nhefs[which(nhefs$cens == 0),]$wt71)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 39.6 59.5 69.2 70.8 79.8 151.7
-summary(nhefs[which(nhefs$cens == 1),]$wt71)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 36.2 63.1 72.1 76.6 87.9 169.2
-
-# estimation of denominator of ip weights for A
-denom.fit <-
- glm(
- qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
- as.factor(education) + smokeintensity +
- I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
- family = binomial(),
- data = nhefs
- )
-summary(denom.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
-#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
-#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71^2), family = binomial(), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -1.988902 1.241279 -1.60 0.10909
-#> as.factor(sex)1 -0.507522 0.148232 -3.42 0.00062 ***
-#> as.factor(race)1 -0.850231 0.205872 -4.13 3.6e-05 ***
-#> age 0.103013 0.048900 2.11 0.03515 *
-#> I(age^2) -0.000605 0.000507 -1.19 0.23297
-#> as.factor(education)2 -0.098320 0.190655 -0.52 0.60607
-#> as.factor(education)3 0.015699 0.170714 0.09 0.92673
-#> as.factor(education)4 -0.042526 0.264276 -0.16 0.87216
-#> as.factor(education)5 0.379663 0.220395 1.72 0.08495 .
-#> smokeintensity -0.065156 0.014759 -4.41 1.0e-05 ***
-#> I(smokeintensity^2) 0.000846 0.000276 3.07 0.00216 **
-#> smokeyrs -0.073371 0.026996 -2.72 0.00657 **
-#> I(smokeyrs^2) 0.000838 0.000443 1.89 0.05867 .
-#> as.factor(exercise)1 0.291412 0.173554 1.68 0.09314 .
-#> as.factor(exercise)2 0.355052 0.179929 1.97 0.04846 *
-#> as.factor(active)1 0.010875 0.129832 0.08 0.93324
-#> as.factor(active)2 0.068312 0.208727 0.33 0.74346
-#> wt71 -0.012848 0.022283 -0.58 0.56423
-#> I(wt71^2) 0.000121 0.000135 0.89 0.37096
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1876.3 on 1628 degrees of freedom
-#> Residual deviance: 1766.7 on 1610 degrees of freedom
-#> AIC: 1805
-#>
-#> Number of Fisher Scoring iterations: 4
-
-pd.qsmk <- predict(denom.fit, type = "response")
-
-# estimation of numerator of ip weights for A
-numer.fit <- glm(qsmk ~ 1, family = binomial(), data = nhefs)
-summary(numer.fit)
-#>
-#> Call:
-#> glm(formula = qsmk ~ 1, family = binomial(), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -1.0318 0.0563 -18.3 <2e-16 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1876.3 on 1628 degrees of freedom
-#> Residual deviance: 1876.3 on 1628 degrees of freedom
-#> AIC: 1878
-#>
-#> Number of Fisher Scoring iterations: 4
-pn.qsmk <- predict(numer.fit, type = "response")
-
-# estimation of denominator of ip weights for C
-denom.cens <- glm(
- cens ~ as.factor(qsmk) + as.factor(sex) +
- as.factor(race) + age + I(age ^ 2) +
- as.factor(education) + smokeintensity +
- I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
- family = binomial(),
- data = nhefs
-)
-summary(denom.cens)
-#>
-#> Call:
-#> glm(formula = cens ~ as.factor(qsmk) + as.factor(sex) + as.factor(race) +
-#> age + I(age^2) + as.factor(education) + smokeintensity +
-#> I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71^2), family = binomial(),
-#> data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) 4.014466 2.576106 1.56 0.1192
-#> as.factor(qsmk)1 0.516867 0.287716 1.80 0.0724 .
-#> as.factor(sex)1 0.057313 0.330278 0.17 0.8622
-#> as.factor(race)1 -0.012271 0.452489 -0.03 0.9784
-#> age -0.269729 0.117465 -2.30 0.0217 *
-#> I(age^2) 0.002884 0.001114 2.59 0.0096 **
-#> as.factor(education)2 -0.440788 0.419399 -1.05 0.2933
-#> as.factor(education)3 -0.164688 0.370547 -0.44 0.6567
-#> as.factor(education)4 0.138447 0.569797 0.24 0.8080
-#> as.factor(education)5 -0.382382 0.560181 -0.68 0.4949
-#> smokeintensity 0.015712 0.034732 0.45 0.6510
-#> I(smokeintensity^2) -0.000113 0.000606 -0.19 0.8517
-#> smokeyrs 0.078597 0.074958 1.05 0.2944
-#> I(smokeyrs^2) -0.000557 0.001032 -0.54 0.5894
-#> as.factor(exercise)1 -0.971471 0.387810 -2.51 0.0122 *
-#> as.factor(exercise)2 -0.583989 0.372313 -1.57 0.1168
-#> as.factor(active)1 -0.247479 0.325455 -0.76 0.4470
-#> as.factor(active)2 0.706583 0.396458 1.78 0.0747 .
-#> wt71 -0.087887 0.040012 -2.20 0.0281 *
-#> I(wt71^2) 0.000635 0.000226 2.81 0.0049 **
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 533.36 on 1628 degrees of freedom
-#> Residual deviance: 465.36 on 1609 degrees of freedom
-#> AIC: 505.4
-#>
-#> Number of Fisher Scoring iterations: 7
-
-pd.cens <- 1 - predict(denom.cens, type = "response")
-
-# estimation of numerator of ip weights for C
-numer.cens <-
- glm(cens ~ as.factor(qsmk), family = binomial(), data = nhefs)
-summary(numer.cens)
-#>
-#> Call:
-#> glm(formula = cens ~ as.factor(qsmk), family = binomial(), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -3.421 0.165 -20.75 <2e-16 ***
-#> as.factor(qsmk)1 0.641 0.264 2.43 0.015 *
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 533.36 on 1628 degrees of freedom
-#> Residual deviance: 527.76 on 1627 degrees of freedom
-#> AIC: 531.8
-#>
-#> Number of Fisher Scoring iterations: 6
-pn.cens <- 1 - predict(numer.cens, type = "response")
-
-nhefs$sw.a <-
- ifelse(nhefs$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
- (pn.qsmk / pd.qsmk))
-nhefs$sw.c <- pn.cens / pd.cens
-nhefs$sw <- nhefs$sw.c * nhefs$sw.a
-
-summary(nhefs$sw.a)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.33 0.86 0.95 1.00 1.08 4.21
-sd(nhefs$sw.a)
-#> [1] 0.284
-summary(nhefs$sw.c)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.94 0.98 0.99 1.01 1.01 7.58
-sd(nhefs$sw.c)
-#> [1] 0.178
-summary(nhefs$sw)
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.35 0.86 0.94 1.01 1.08 12.86
-sd(nhefs$sw)
-#> [1] 0.411
-
-msm.sw <- geeglm(
- wt82_71 ~ qsmk,
- data = nhefs,
- weights = sw,
- id = seqn,
- corstr = "independence"
-)
-summary(msm.sw)
-#>
-#> Call:
-#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs, weights = sw,
-#> id = seqn, corstr = "independence")
-#>
-#> Coefficients:
-#> Estimate Std.err Wald Pr(>|W|)
-#> (Intercept) 1.662 0.233 51.0 9.3e-13 ***
-#> qsmk 3.496 0.526 44.2 2.9e-11 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> Correlation structure = independence
-#> Estimated Scale Parameters:
-#>
-#> Estimate Std.err
-#> (Intercept) 61.8 3.83
-#> Number of clusters: 1566 Maximum cluster size: 1
-
-beta <- coef(msm.sw)
-SE <- coef(summary(msm.sw))[, 2]
-lcl <- beta - qnorm(0.975) * SE
-ucl <- beta + qnorm(0.975) * SE
-cbind(beta, lcl, ucl)
-#> beta lcl ucl
-#> (Intercept) 1.66 1.21 2.12
-#> qsmk 3.50 2.47 4.53
+summary(nhefs[which(nhefs$cens == 0),]$wt71)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 39.6 59.5 69.2 70.8 79.8 151.7
summary(nhefs[which(nhefs$cens == 1),]$wt71)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 36.2 63.1 72.1 76.6 87.9 169.2
+# estimation of denominator of ip weights for A
+denom.fit <-
+ glm(
+ qsmk ~ as.factor(sex) + as.factor(race) + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
+ family = binomial(),
+ data = nhefs
+ )
+summary(denom.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ as.factor(sex) + as.factor(race) + age +
+#> I(age^2) + as.factor(education) + smokeintensity + I(smokeintensity^2) +
+#> smokeyrs + I(smokeyrs^2) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71^2), family = binomial(), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -1.988902 1.241279 -1.60 0.10909
+#> as.factor(sex)1 -0.507522 0.148232 -3.42 0.00062 ***
+#> as.factor(race)1 -0.850231 0.205872 -4.13 3.6e-05 ***
+#> age 0.103013 0.048900 2.11 0.03515 *
+#> I(age^2) -0.000605 0.000507 -1.19 0.23297
+#> as.factor(education)2 -0.098320 0.190655 -0.52 0.60607
+#> as.factor(education)3 0.015699 0.170714 0.09 0.92673
+#> as.factor(education)4 -0.042526 0.264276 -0.16 0.87216
+#> as.factor(education)5 0.379663 0.220395 1.72 0.08495 .
+#> smokeintensity -0.065156 0.014759 -4.41 1.0e-05 ***
+#> I(smokeintensity^2) 0.000846 0.000276 3.07 0.00216 **
+#> smokeyrs -0.073371 0.026996 -2.72 0.00657 **
+#> I(smokeyrs^2) 0.000838 0.000443 1.89 0.05867 .
+#> as.factor(exercise)1 0.291412 0.173554 1.68 0.09314 .
+#> as.factor(exercise)2 0.355052 0.179929 1.97 0.04846 *
+#> as.factor(active)1 0.010875 0.129832 0.08 0.93324
+#> as.factor(active)2 0.068312 0.208727 0.33 0.74346
+#> wt71 -0.012848 0.022283 -0.58 0.56423
+#> I(wt71^2) 0.000121 0.000135 0.89 0.37096
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1876.3 on 1628 degrees of freedom
+#> Residual deviance: 1766.7 on 1610 degrees of freedom
+#> AIC: 1805
+#>
+#> Number of Fisher Scoring iterations: 4
+pd.qsmk <- predict(denom.fit, type = "response")
+
+# estimation of numerator of ip weights for A
+numer.fit <- glm(qsmk ~ 1, family = binomial(), data = nhefs)
+summary(numer.fit)
+#>
+#> Call:
+#> glm(formula = qsmk ~ 1, family = binomial(), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -1.0318 0.0563 -18.3 <2e-16 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1876.3 on 1628 degrees of freedom
+#> Residual deviance: 1876.3 on 1628 degrees of freedom
+#> AIC: 1878
+#>
+#> Number of Fisher Scoring iterations: 4
pn.qsmk <- predict(numer.fit, type = "response")
+
+# estimation of denominator of ip weights for C
+denom.cens <- glm(
+ cens ~ as.factor(qsmk) + as.factor(sex) +
+ as.factor(race) + age + I(age ^ 2) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity ^ 2) + smokeyrs + I(smokeyrs ^ 2) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 ^ 2),
+ family = binomial(),
+ data = nhefs
+)
+summary(denom.cens)
+#>
+#> Call:
+#> glm(formula = cens ~ as.factor(qsmk) + as.factor(sex) + as.factor(race) +
+#> age + I(age^2) + as.factor(education) + smokeintensity +
+#> I(smokeintensity^2) + smokeyrs + I(smokeyrs^2) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71^2), family = binomial(),
+#> data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) 4.014466 2.576106 1.56 0.1192
+#> as.factor(qsmk)1 0.516867 0.287716 1.80 0.0724 .
+#> as.factor(sex)1 0.057313 0.330278 0.17 0.8622
+#> as.factor(race)1 -0.012271 0.452489 -0.03 0.9784
+#> age -0.269729 0.117465 -2.30 0.0217 *
+#> I(age^2) 0.002884 0.001114 2.59 0.0096 **
+#> as.factor(education)2 -0.440788 0.419399 -1.05 0.2933
+#> as.factor(education)3 -0.164688 0.370547 -0.44 0.6567
+#> as.factor(education)4 0.138447 0.569797 0.24 0.8080
+#> as.factor(education)5 -0.382382 0.560181 -0.68 0.4949
+#> smokeintensity 0.015712 0.034732 0.45 0.6510
+#> I(smokeintensity^2) -0.000113 0.000606 -0.19 0.8517
+#> smokeyrs 0.078597 0.074958 1.05 0.2944
+#> I(smokeyrs^2) -0.000557 0.001032 -0.54 0.5894
+#> as.factor(exercise)1 -0.971471 0.387810 -2.51 0.0122 *
+#> as.factor(exercise)2 -0.583989 0.372313 -1.57 0.1168
+#> as.factor(active)1 -0.247479 0.325455 -0.76 0.4470
+#> as.factor(active)2 0.706583 0.396458 1.78 0.0747 .
+#> wt71 -0.087887 0.040012 -2.20 0.0281 *
+#> I(wt71^2) 0.000635 0.000226 2.81 0.0049 **
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 533.36 on 1628 degrees of freedom
+#> Residual deviance: 465.36 on 1609 degrees of freedom
+#> AIC: 505.4
+#>
+#> Number of Fisher Scoring iterations: 7
+pd.cens <- 1 - predict(denom.cens, type = "response")
+
+# estimation of numerator of ip weights for C
+numer.cens <-
+ glm(cens ~ as.factor(qsmk), family = binomial(), data = nhefs)
+summary(numer.cens)
+#>
+#> Call:
+#> glm(formula = cens ~ as.factor(qsmk), family = binomial(), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -3.421 0.165 -20.75 <2e-16 ***
+#> as.factor(qsmk)1 0.641 0.264 2.43 0.015 *
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 533.36 on 1628 degrees of freedom
+#> Residual deviance: 527.76 on 1627 degrees of freedom
+#> AIC: 531.8
+#>
+#> Number of Fisher Scoring iterations: 6
pn.cens <- 1 - predict(numer.cens, type = "response")
+
+nhefs$sw.a <-
+ ifelse(nhefs$qsmk == 0, ((1 - pn.qsmk) / (1 - pd.qsmk)),
+ (pn.qsmk / pd.qsmk))
+nhefs$sw.c <- pn.cens / pd.cens
+nhefs$sw <- nhefs$sw.c * nhefs$sw.a
+
+summary(nhefs$sw.a)
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.33 0.86 0.95 1.00 1.08 4.21
+msm.sw <- geeglm(
+ wt82_71 ~ qsmk,
+ data = nhefs,
+ weights = sw,
+ id = seqn,
+ corstr = "independence"
+)
+summary(msm.sw)
+#>
+#> Call:
+#> geeglm(formula = wt82_71 ~ qsmk, data = nhefs, weights = sw,
+#> id = seqn, corstr = "independence")
+#>
+#> Coefficients:
+#> Estimate Std.err Wald Pr(>|W|)
+#> (Intercept) 1.662 0.233 51.0 9.3e-13 ***
+#> qsmk 3.496 0.526 44.2 2.9e-11 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> Correlation structure = independence
+#> Estimated Scale Parameters:
+#>
+#> Estimate Std.err
+#> (Intercept) 61.8 3.83
+#> Number of clusters: 1566 Maximum cluster size: 1
+beta <- coef(msm.sw)
+SE <- coef(summary(msm.sw))[, 2]
+lcl <- beta - qnorm(0.975) * SE
+ucl <- beta + qnorm(0.975) * SE
+cbind(beta, lcl, ucl)
+#> beta lcl ucl
+#> (Intercept) 1.66 1.21 2.12
+#> qsmk 3.50 2.47 4.53
15. Outcome regression and propensity scores: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -324,30 +324,30 @@
Program 15.1
use ./data/nhefs-formatted, clear
-
-/* Generate smoking intensity among smokers product term */
-gen qsmkintensity = qsmk*smokeintensity
-
-* Regression on covariates, allowing for some effect modfication
-regress wt82_71 qsmk qsmkintensity ///
- c.smokeintensity##c.smokeintensity sex race c.age##c.age ///
- ib(last).education c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71
-
-/* Display the estimated mean difference between quitting and
- not quitting value when smoke intensity = 5 cigarettes/ day */
-lincom 1*_b[qsmk] + 5*1*_b[qsmkintensity]
-
-/* Display the estimated mean difference between quitting and
- not quitting value when smoke intensity = 40 cigarettes/ day */
-lincom 1*_b[qsmk] + 40*1*_b[qsmkintensity]
-
-/* Regression on covariates, with no product terms */
-regress wt82_71 qsmk c.smokeintensity##c.smokeintensity ///
- sex race c.age##c.age ///
- ib(last).education c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71
use ./data/nhefs-formatted, clear
+
+/* Generate smoking intensity among smokers product term */
+gen qsmkintensity = qsmk*smokeintensity
+
+* Regression on covariates, allowing for some effect modification
+regress wt82_71 qsmk qsmkintensity ///
+ c.smokeintensity##c.smokeintensity sex race c.age##c.age ///
+ ib(last).education c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71
+
+/* Display the estimated mean difference between quitting and
+ not quitting value when smoke intensity = 5 cigarettes/ day */
+lincom 1*_b[qsmk] + 5*1*_b[qsmkintensity]
+
+/* Display the estimated mean difference between quitting and
+ not quitting value when smoke intensity = 40 cigarettes/ day */
+lincom 1*_b[qsmk] + 40*1*_b[qsmkintensity]
+
+/* Regression on covariates, with no product terms */
+regress wt82_71 qsmk c.smokeintensity##c.smokeintensity ///
+ sex race c.age##c.age ///
+ ib(last).education c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71
Source | SS df MS Number of obs = 1,566
-------------+---------------------------------- F(20, 1545) = 13.45
Model | 14412.558 20 720.6279 Prob > F = 0.0000
@@ -470,42 +470,42 @@
Program 15.2
+use ./data/nhefs-formatted, clear
-
-/*Fit a model for the exposure, quitting smoking*/
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71
-
-/*Estimate the propensity score, P(Qsmk|Covariates)*/
-predict ps, pr
-
-/*Check the distribution of the propensity score*/
-bys qsmk: summarize ps
-
-/*Return extreme values of propensity score:
- note, for Stata versions 15 and above, start by installing extremes*/
-* ssc install extremes
-extremes ps seqn
-bys qsmk: extremes ps seqn
-
-save ./data/nhefs-ps, replace
-
-/*Plotting the estimated propensity score*/
-histogram ps, width(0.05) start(0.025) ///
- frequency fcolor(none) lcolor(black) ///
- lpattern(solid) addlabel ///
- addlabopts(mlabcolor(black) mlabposition(12) ///
- mlabangle(zero)) ///
- ytitle(No. Subjects) ylabel(#4) ///
- xtitle(Estimated Propensity Score) xlabel(#15) ///
- by(, title(Estimated Propensity Score Distribution) ///
- subtitle(By Quit Smoking Status)) ///
- by(, legend(off)) ///
- by(qsmk, style(compact) colfirst) ///
- subtitle(, size(small) box bexpand)
-qui gr export ./figs/stata-fig-15-2.png, replace
use ./data/nhefs-formatted, clear
+
+/*Fit a model for the exposure, quitting smoking*/
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71
+
+/*Estimate the propensity score, P(Qsmk|Covariates)*/
+predict ps, pr
+
+/*Check the distribution of the propensity score*/
+bys qsmk: summarize ps
+
+/*Return extreme values of propensity score:
+ note, for Stata versions 15 and above, start by installing extremes*/
+* ssc install extremes
+extremes ps seqn
+bys qsmk: extremes ps seqn
+
+save ./data/nhefs-ps, replace
+
+/*Plotting the estimated propensity score*/
+histogram ps, width(0.05) start(0.025) ///
+ frequency fcolor(none) lcolor(black) ///
+ lpattern(solid) addlabel ///
+ addlabopts(mlabcolor(black) mlabposition(12) ///
+ mlabangle(zero)) ///
+ ytitle(No. Subjects) ylabel(#4) ///
+ xtitle(Estimated Propensity Score) xlabel(#15) ///
+ by(, title(Estimated Propensity Score Distribution) ///
+ subtitle(By Quit Smoking Status)) ///
+ by(, legend(off)) ///
+ by(qsmk, style(compact) colfirst) ///
+ subtitle(, size(small) box bexpand)
+qui gr export ./figs/stata-fig-15-2.png, replace
Iteration 0: Log likelihood = -893.02712
Iteration 1: Log likelihood = -839.70016
Iteration 2: Log likelihood = -838.45045
@@ -647,19 +647,19 @@
Program 15.3
+use ./data/nhefs-ps, clear
-
-/*Calculation of deciles of ps*/
-xtile ps_dec = ps, nq(10)
-by ps_dec, sort: summarize ps
-
-/*Stratification on PS deciles, allowing for effect modification*/
-/*Note: Stata compares qsmk 0 vs qsmk 1, so the coefficients are reversed
-relative to the book*/
-by ps_dec: ttest wt82_71, by(qsmk)
-
-/*Regression on PS deciles, with no product terms*/
-regress wt82_71 qsmk ib(last).ps_dec
use ./data/nhefs-ps, clear
+
+/*Calculation of deciles of ps*/
+xtile ps_dec = ps, nq(10)
+by ps_dec, sort: summarize ps
+
+/*Stratification on PS deciles, allowing for effect modification*/
+/*Note: Stata compares qsmk 0 vs qsmk 1, so the coefficients are reversed
+relative to the book*/
+by ps_dec: ttest wt82_71, by(qsmk)
+
+/*Regression on PS deciles, with no product terms*/
+regress wt82_71 qsmk ib(last).ps_dec
-> ps_dec = 1
Variable | Obs Mean Std. dev. Min Max
@@ -964,102 +964,102 @@
Program 15.4
+use ./data/nhefs-formatted, clear
-
-/*Estimate the propensity score*/
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ///
- ib(last).active c.wt71##c.wt71
-predict ps, pr
-
-/*Expand the dataset for standardization*/
-expand 2, generate(interv)
-expand 2 if interv == 0, generate(interv2)
-replace interv = -1 if interv2 ==1
-drop interv2
-tab interv
-replace wt82_71 = . if interv != -1
-replace qsmk = 0 if interv == 0
-replace qsmk = 1 if interv == 1
-by interv, sort: summarize qsmk
-
-/*Regression on the propensity score, allowing for effect modification*/
-regress wt82_71 qsmk##c.ps
-predict predY, xb
-by interv, sort: summarize predY
-
-quietly summarize predY if(interv == -1)
-matrix input observe = (-1,`r(mean)')
-quietly summarize predY if(interv == 0)
-matrix observe = (observe \0,`r(mean)')
-quietly summarize predY if(interv == 1)
-matrix observe = (observe \1,`r(mean)')
-matrix observe = (observe \., observe[3,2]-observe[2,2])
-matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
-matrix colnames observe = interv value
-matrix list observe
-
-/*bootstrap program*/
-drop if interv != -1
-gen meanY_b =.
-qui save ./data/nhefs_std, replace
-
-capture program drop bootstdz
-
-program define bootstdz, rclass
-use ./data/nhefs_std, clear
-preserve
-bsample
-/*Create 2 new copies of the data.
-Set the outcome AND the exposure to missing in the copies*/
-expand 2, generate(interv_b)
-expand 2 if interv_b == 0, generate(interv2_b)
-qui replace interv_b = -1 if interv2_b ==1
-qui drop interv2_b
-qui replace wt82_71 = . if interv_b != -1
-qui replace qsmk = . if interv_b != -1
-
-/*Fit the propensity score in the original data
-(where qsmk is not missing) and generate predictions for everyone*/
-logit qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity ///
- c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
- c.wt71##c.wt71
-predict ps_b, pr
-
-/*Set the exposure to 0 for everyone in copy 0,
-and 1 to everyone for copy 1*/
-qui replace qsmk = 0 if interv_b == 0
-qui replace qsmk = 1 if interv_b == 1
-
-/*Fit the outcome regression in the original data
-(where wt82_71 is not missing) and
-generate predictions for everyone*/
-regress wt82_71 qsmk##c.ps
-predict predY_b, xb
-
-/*Summarize the predictions in each set of copies*/
-summarize predY_b if interv_b == 0
-return scalar boot_0 = r(mean)
-summarize predY_b if interv_b == 1
-return scalar boot_1 = r(mean)
-return scalar boot_diff = return(boot_1) - return(boot_0)
-qui drop meanY_b
-restore
-end
-
-/*Then we use the `simulate` command to run the bootstraps
-as many times as we want.
-Start with reps(10) to make sure your code runs,
-and then change to reps(1000) to generate your final CIs*/
-simulate EY_a0=r(boot_0) EY_a1 = r(boot_1) ///
- difference = r(boot_diff), reps(500) seed(1): bootstdz
-
-matrix pe = observe[2..4, 2]'
-matrix list pe
-bstat, stat(pe) n(1629)
-estat bootstrap, p
use ./data/nhefs-formatted, clear
+
+/*Estimate the propensity score*/
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ///
+ ib(last).active c.wt71##c.wt71
+predict ps, pr
+
+/*Expand the dataset for standardization*/
+expand 2, generate(interv)
+expand 2 if interv == 0, generate(interv2)
+replace interv = -1 if interv2 ==1
+drop interv2
+tab interv
+replace wt82_71 = . if interv != -1
+replace qsmk = 0 if interv == 0
+replace qsmk = 1 if interv == 1
+by interv, sort: summarize qsmk
+
+/*Regression on the propensity score, allowing for effect modification*/
+regress wt82_71 qsmk##c.ps
+predict predY, xb
+by interv, sort: summarize predY
+
+quietly summarize predY if(interv == -1)
+matrix input observe = (-1,`r(mean)')
+quietly summarize predY if(interv == 0)
+matrix observe = (observe \0,`r(mean)')
+quietly summarize predY if(interv == 1)
+matrix observe = (observe \1,`r(mean)')
+matrix observe = (observe \., observe[3,2]-observe[2,2])
+matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
+matrix colnames observe = interv value
+matrix list observe
+
+/*bootstrap program*/
+drop if interv != -1
+gen meanY_b =.
+qui save ./data/nhefs_std, replace
+
+capture program drop bootstdz
+
+program define bootstdz, rclass
+use ./data/nhefs_std, clear
+preserve
+bsample
+/*Create 2 new copies of the data.
+Set the outcome AND the exposure to missing in the copies*/
+expand 2, generate(interv_b)
+expand 2 if interv_b == 0, generate(interv2_b)
+qui replace interv_b = -1 if interv2_b ==1
+qui drop interv2_b
+qui replace wt82_71 = . if interv_b != -1
+qui replace qsmk = . if interv_b != -1
+
+/*Fit the propensity score in the original data
+(where qsmk is not missing) and generate predictions for everyone*/
+logit qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity ///
+ c.smokeyrs##c.smokeyrs ib(last).exercise ib(last).active ///
+ c.wt71##c.wt71
+predict ps_b, pr
+
+/*Set the exposure to 0 for everyone in copy 0,
+and 1 to everyone for copy 1*/
+qui replace qsmk = 0 if interv_b == 0
+qui replace qsmk = 1 if interv_b == 1
+
+/*Fit the outcome regression in the original data
+(where wt82_71 is not missing) and
+generate predictions for everyone*/
+regress wt82_71 qsmk##c.ps
+predict predY_b, xb
+
+/*Summarize the predictions in each set of copies*/
+summarize predY_b if interv_b == 0
+return scalar boot_0 = r(mean)
+summarize predY_b if interv_b == 1
+return scalar boot_1 = r(mean)
+return scalar boot_diff = return(boot_1) - return(boot_0)
+qui drop meanY_b
+restore
+end
+
+/*Then we use the `simulate` command to run the bootstraps
+as many times as we want.
+Start with reps(10) to make sure your code runs,
+and then change to reps(1000) to generate your final CIs*/
+simulate EY_a0=r(boot_0) EY_a1 = r(boot_1) ///
+ difference = r(boot_diff), reps(500) seed(1): bootstdz
+
+matrix pe = observe[2..4, 2]'
+matrix list pe
+bstat, stat(pe) n(1629)
+estat bootstrap, p
Iteration 0: Log likelihood = -893.02712
Iteration 1: Log likelihood = -839.70016
Iteration 2: Log likelihood = -838.45045
diff --git a/docs/outcome-regression-and-propensity-scores.html b/docs/outcome-regression-and-propensity-scores.html
index 63e30f7..e633213 100644
--- a/docs/outcome-regression-and-propensity-scores.html
+++ b/docs/outcome-regression-and-propensity-scores.html
@@ -26,7 +26,7 @@
-
+
@@ -316,233 +316,233 @@
Program 15.1
-library(here)
#install.packages("readxl") # install package if required
-library("readxl")
-
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
-
-# regression on covariates, allowing for some effect modification
-fit <- glm(wt82_71 ~ qsmk + sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71*wt71) + I(qsmk*smokeintensity), data=nhefs)
-summary(fit)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
-#> data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
-#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
-#> sex -1.4302717 0.4689576 -3.050 0.002328 **
-#> race 0.5601096 0.5818888 0.963 0.335913
-#> age 0.3596353 0.1633188 2.202 0.027809 *
-#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
-#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
-#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
-#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
-#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
-#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
-#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
-#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
-#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
-#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
-#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
-#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
-#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
-#> wt71 0.0455018 0.0833709 0.546 0.585299
-#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
-#> I(qsmk * smokeintensity) 0.0466628 0.0351448 1.328 0.184463
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 53.5683)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 82763 on 1545 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 10701
-#>
-#> Number of Fisher Scoring iterations: 2
-
-# (step 1) build the contrast matrix with all zeros
-# this function builds the blank matrix
-# install.packages("multcomp") # install packages if necessary
-library("multcomp")
-#> Loading required package: mvtnorm
-#> Loading required package: survival
-#> Loading required package: TH.data
-#> Loading required package: MASS
-#>
-#> Attaching package: 'TH.data'
-#> The following object is masked from 'package:MASS':
-#>
-#> geyser
-makeContrastMatrix <- function(model, nrow, names) {
- m <- matrix(0, nrow = nrow, ncol = length(coef(model)))
- colnames(m) <- names(coef(model))
- rownames(m) <- names
- return(m)
-}
-K1 <-
- makeContrastMatrix(
- fit,
- 2,
- c(
- 'Effect of Quitting Smoking at Smokeintensity of 5',
- 'Effect of Quitting Smoking at Smokeintensity of 40'
- )
- )
-# (step 2) fill in the relevant non-zero elements
-K1[1:2, 'qsmk'] <- 1
-K1[1:2, 'I(qsmk * smokeintensity)'] <- c(5, 40)
-
-# (step 3) check the contrast matrix
-K1
-#> (Intercept) qsmk sex race
-#> Effect of Quitting Smoking at Smokeintensity of 5 0 1 0 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0 1 0 0
-#> age I(age * age)
-#> Effect of Quitting Smoking at Smokeintensity of 5 0 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0 0
-#> as.factor(education)2
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(education)3
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(education)4
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(education)5
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> smokeintensity
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> I(smokeintensity * smokeintensity)
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> smokeyrs
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> I(smokeyrs * smokeyrs)
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(exercise)1
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(exercise)2
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(active)1
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> as.factor(active)2 wt71
-#> Effect of Quitting Smoking at Smokeintensity of 5 0 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0 0
-#> I(wt71 * wt71)
-#> Effect of Quitting Smoking at Smokeintensity of 5 0
-#> Effect of Quitting Smoking at Smokeintensity of 40 0
-#> I(qsmk * smokeintensity)
-#> Effect of Quitting Smoking at Smokeintensity of 5 5
-#> Effect of Quitting Smoking at Smokeintensity of 40 40
-
-# (step 4) estimate the contrasts, get tests and confidence intervals for them
-estimates1 <- glht(fit, K1)
- summary(estimates1)
-#>
-#> Simultaneous Tests for General Linear Hypotheses
-#>
-#> Fit: glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
-#> data = nhefs)
-#>
-#> Linear Hypotheses:
-#> Estimate Std. Error
-#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 2.7929 0.6683
-#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 4.4261 0.8478
-#> z value Pr(>|z|)
-#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 4.179 5.84e-05 ***
-#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 5.221 3.56e-07 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#> (Adjusted p values reported -- single-step method)
- confint(estimates1)
-#>
-#> Simultaneous Confidence Intervals
-#>
-#> Fit: glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
-#> data = nhefs)
-#>
-#> Quantile = 2.2281
-#> 95% family-wise confidence level
-#>
-#>
-#> Linear Hypotheses:
-#> Estimate lwr upr
-#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 2.7929 1.3039 4.2819
-#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 4.4261 2.5372 6.3151
-
-# regression on covariates, not allowing for effect modification
-fit2 <- glm(wt82_71 ~ qsmk + sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71*wt71), data=nhefs)
-
-summary(fit2)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -1.6586176 4.3137734 -0.384 0.700666
-#> qsmk 3.4626218 0.4384543 7.897 5.36e-15 ***
-#> sex -1.4650496 0.4683410 -3.128 0.001792 **
-#> race 0.5864117 0.5816949 1.008 0.313560
-#> age 0.3626624 0.1633431 2.220 0.026546 *
-#> I(age * age) -0.0061377 0.0017263 -3.555 0.000389 ***
-#> as.factor(education)2 0.8185263 0.6067815 1.349 0.177546
-#> as.factor(education)3 0.5715004 0.5561211 1.028 0.304273
-#> as.factor(education)4 1.5085173 0.8323778 1.812 0.070134 .
-#> as.factor(education)5 -0.1708264 0.7413289 -0.230 0.817786
-#> smokeintensity 0.0651533 0.0503115 1.295 0.195514
-#> I(smokeintensity * smokeintensity) -0.0010468 0.0009373 -1.117 0.264261
-#> smokeyrs 0.1333931 0.0917319 1.454 0.146104
-#> I(smokeyrs * smokeyrs) -0.0018270 0.0015438 -1.183 0.236818
-#> as.factor(exercise)1 0.3206824 0.5349616 0.599 0.548961
-#> as.factor(exercise)2 0.3628786 0.5589557 0.649 0.516300
-#> as.factor(active)1 -0.9429574 0.4100208 -2.300 0.021593 *
-#> as.factor(active)2 -0.2580374 0.6847219 -0.377 0.706337
-#> wt71 0.0373642 0.0831658 0.449 0.653297
-#> I(wt71 * wt71) -0.0009158 0.0005235 -1.749 0.080426 .
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 53.59474)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 82857 on 1546 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 10701
-#>
-#> Number of Fisher Scoring iterations: 2
#install.packages("readxl") # install package if required
+library("readxl")
+
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
+
+# regression on covariates, allowing for some effect modification
+fit <- glm(wt82_71 ~ qsmk + sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71*wt71) + I(qsmk*smokeintensity), data=nhefs)
+summary(fit)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
+#> data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
+#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
+#> sex -1.4302717 0.4689576 -3.050 0.002328 **
+#> race 0.5601096 0.5818888 0.963 0.335913
+#> age 0.3596353 0.1633188 2.202 0.027809 *
+#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
+#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
+#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
+#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
+#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
+#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
+#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
+#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
+#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
+#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
+#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
+#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
+#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
+#> wt71 0.0455018 0.0833709 0.546 0.585299
+#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
+#> I(qsmk * smokeintensity) 0.0466628 0.0351448 1.328 0.184463
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 53.5683)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 82763 on 1545 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 10701
+#>
+#> Number of Fisher Scoring iterations: 2
+# (step 1) build the contrast matrix with all zeros
+# this function builds the blank matrix
+# install.packages("multcomp") # install packages if necessary
+library("multcomp")
+#> Loading required package: mvtnorm
+#> Loading required package: survival
+#> Loading required package: TH.data
+#> Loading required package: MASS
+#>
+#> Attaching package: 'TH.data'
+#> The following object is masked from 'package:MASS':
+#>
+#> geyser
makeContrastMatrix <- function(model, nrow, names) {
+ m <- matrix(0, nrow = nrow, ncol = length(coef(model)))
+ colnames(m) <- names(coef(model))
+ rownames(m) <- names
+ return(m)
+}
+K1 <-
+ makeContrastMatrix(
+ fit,
+ 2,
+ c(
+ 'Effect of Quitting Smoking at Smokeintensity of 5',
+ 'Effect of Quitting Smoking at Smokeintensity of 40'
+ )
+ )
+# (step 2) fill in the relevant non-zero elements
+K1[1:2, 'qsmk'] <- 1
+K1[1:2, 'I(qsmk * smokeintensity)'] <- c(5, 40)
+
+# (step 3) check the contrast matrix
+K1
+#> (Intercept) qsmk sex race
+#> Effect of Quitting Smoking at Smokeintensity of 5 0 1 0 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0 1 0 0
+#> age I(age * age)
+#> Effect of Quitting Smoking at Smokeintensity of 5 0 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0 0
+#> as.factor(education)2
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(education)3
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(education)4
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(education)5
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> smokeintensity
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> I(smokeintensity * smokeintensity)
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> smokeyrs
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> I(smokeyrs * smokeyrs)
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(exercise)1
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(exercise)2
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(active)1
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> as.factor(active)2 wt71
+#> Effect of Quitting Smoking at Smokeintensity of 5 0 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0 0
+#> I(wt71 * wt71)
+#> Effect of Quitting Smoking at Smokeintensity of 5 0
+#> Effect of Quitting Smoking at Smokeintensity of 40 0
+#> I(qsmk * smokeintensity)
+#> Effect of Quitting Smoking at Smokeintensity of 5 5
+#> Effect of Quitting Smoking at Smokeintensity of 40 40
+# (step 4) estimate the contrasts, get tests and confidence intervals for them
+estimates1 <- glht(fit, K1)
+ summary(estimates1)
+#>
+#> Simultaneous Tests for General Linear Hypotheses
+#>
+#> Fit: glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
+#> data = nhefs)
+#>
+#> Linear Hypotheses:
+#> Estimate Std. Error
+#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 2.7929 0.6683
+#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 4.4261 0.8478
+#> z value Pr(>|z|)
+#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 4.179 5.84e-05 ***
+#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 5.221 3.56e-07 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#> (Adjusted p values reported -- single-step method)
confint(estimates1)
+#>
+#> Simultaneous Confidence Intervals
+#>
+#> Fit: glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
+#> data = nhefs)
+#>
+#> Quantile = 2.2281
+#> 95% family-wise confidence level
+#>
+#>
+#> Linear Hypotheses:
+#> Estimate lwr upr
+#> Effect of Quitting Smoking at Smokeintensity of 5 == 0 2.7929 1.3039 4.2819
+#> Effect of Quitting Smoking at Smokeintensity of 40 == 0 4.4261 2.5372 6.3151
+# regression on covariates, not allowing for effect modification
+fit2 <- glm(wt82_71 ~ qsmk + sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71*wt71), data=nhefs)
+
+summary(fit2)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -1.6586176 4.3137734 -0.384 0.700666
+#> qsmk 3.4626218 0.4384543 7.897 5.36e-15 ***
+#> sex -1.4650496 0.4683410 -3.128 0.001792 **
+#> race 0.5864117 0.5816949 1.008 0.313560
+#> age 0.3626624 0.1633431 2.220 0.026546 *
+#> I(age * age) -0.0061377 0.0017263 -3.555 0.000389 ***
+#> as.factor(education)2 0.8185263 0.6067815 1.349 0.177546
+#> as.factor(education)3 0.5715004 0.5561211 1.028 0.304273
+#> as.factor(education)4 1.5085173 0.8323778 1.812 0.070134 .
+#> as.factor(education)5 -0.1708264 0.7413289 -0.230 0.817786
+#> smokeintensity 0.0651533 0.0503115 1.295 0.195514
+#> I(smokeintensity * smokeintensity) -0.0010468 0.0009373 -1.117 0.264261
+#> smokeyrs 0.1333931 0.0917319 1.454 0.146104
+#> I(smokeyrs * smokeyrs) -0.0018270 0.0015438 -1.183 0.236818
+#> as.factor(exercise)1 0.3206824 0.5349616 0.599 0.548961
+#> as.factor(exercise)2 0.3628786 0.5589557 0.649 0.516300
+#> as.factor(active)1 -0.9429574 0.4100208 -2.300 0.021593 *
+#> as.factor(active)2 -0.2580374 0.6847219 -0.377 0.706337
+#> wt71 0.0373642 0.0831658 0.449 0.653297
+#> I(wt71 * wt71) -0.0009158 0.0005235 -1.749 0.080426 .
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 53.59474)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 82857 on 1546 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 10701
+#>
+#> Number of Fisher Scoring iterations: 2
Program 15.2
@@ -550,117 +550,117 @@ Program 15.2
fit3 <- glm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
- + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71*wt71), data=nhefs, family=binomial())
-summary(fit3)
-#>
-#> Call:
-#> glm(formula = qsmk ~ sex + race + age + I(age * age) + as.factor(education) +
-#> smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs +
-#> I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active) +
-#> wt71 + I(wt71 * wt71), family = binomial(), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error z value Pr(>|z|)
-#> (Intercept) -1.9889022 1.2412792 -1.602 0.109089
-#> sex -0.5075218 0.1482316 -3.424 0.000617 ***
-#> race -0.8502312 0.2058720 -4.130 3.63e-05 ***
-#> age 0.1030132 0.0488996 2.107 0.035150 *
-#> I(age * age) -0.0006052 0.0005074 -1.193 0.232973
-#> as.factor(education)2 -0.0983203 0.1906553 -0.516 0.606066
-#> as.factor(education)3 0.0156987 0.1707139 0.092 0.926730
-#> as.factor(education)4 -0.0425260 0.2642761 -0.161 0.872160
-#> as.factor(education)5 0.3796632 0.2203947 1.723 0.084952 .
-#> smokeintensity -0.0651561 0.0147589 -4.415 1.01e-05 ***
-#> I(smokeintensity * smokeintensity) 0.0008461 0.0002758 3.067 0.002160 **
-#> smokeyrs -0.0733708 0.0269958 -2.718 0.006571 **
-#> I(smokeyrs * smokeyrs) 0.0008384 0.0004435 1.891 0.058669 .
-#> as.factor(exercise)1 0.2914117 0.1735543 1.679 0.093136 .
-#> as.factor(exercise)2 0.3550517 0.1799293 1.973 0.048463 *
-#> as.factor(active)1 0.0108754 0.1298320 0.084 0.933243
-#> as.factor(active)2 0.0683123 0.2087269 0.327 0.743455
-#> wt71 -0.0128478 0.0222829 -0.577 0.564226
-#> I(wt71 * wt71) 0.0001209 0.0001352 0.895 0.370957
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for binomial family taken to be 1)
-#>
-#> Null deviance: 1876.3 on 1628 degrees of freedom
-#> Residual deviance: 1766.7 on 1610 degrees of freedom
-#> AIC: 1804.7
-#>
-#> Number of Fisher Scoring iterations: 4
-nhefs$ps <- predict(fit3, nhefs, type="response")
-
-summary(nhefs$ps[nhefs$qsmk==0])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.05298 0.16949 0.22747 0.24504 0.30441 0.65788
-summary(nhefs$ps[nhefs$qsmk==1])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 0.06248 0.22046 0.28897 0.31240 0.38122 0.79320
-
-# # plotting the estimated propensity score
-# install.packages("ggplot2") # install packages if necessary
-# install.packages("dplyr")
-library("ggplot2")
-library("dplyr")
-#>
-#> Attaching package: 'dplyr'
-#> The following object is masked from 'package:MASS':
-#>
-#> select
-#> The following objects are masked from 'package:stats':
-#>
-#> filter, lag
-#> The following objects are masked from 'package:base':
-#>
-#> intersect, setdiff, setequal, union
-ggplot(nhefs, aes(x = ps, fill = qsmk)) + geom_density(alpha = 0.2) +
- xlab('Probability of Quitting Smoking During Follow-up') +
- ggtitle('Propensity Score Distribution by Treatment Group') +
- scale_fill_discrete('') +
- theme(legend.position = 'bottom', legend.direction = 'vertical')
-#> Warning: The following aesthetics were dropped during statistical transformation: fill.
-#> ℹ This can happen when ggplot fails to infer the correct grouping structure in
-#> the data.
-#> ℹ Did you forget to specify a `group` aesthetic or to convert a numerical
-#> variable into a factor?
fit3 <- glm(qsmk ~ sex + race + age + I(age*age) + as.factor(education)
+ + smokeintensity + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71*wt71), data=nhefs, family=binomial())
+summary(fit3)
+#>
+#> Call:
+#> glm(formula = qsmk ~ sex + race + age + I(age * age) + as.factor(education) +
+#> smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs +
+#> I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active) +
+#> wt71 + I(wt71 * wt71), family = binomial(), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error z value Pr(>|z|)
+#> (Intercept) -1.9889022 1.2412792 -1.602 0.109089
+#> sex -0.5075218 0.1482316 -3.424 0.000617 ***
+#> race -0.8502312 0.2058720 -4.130 3.63e-05 ***
+#> age 0.1030132 0.0488996 2.107 0.035150 *
+#> I(age * age) -0.0006052 0.0005074 -1.193 0.232973
+#> as.factor(education)2 -0.0983203 0.1906553 -0.516 0.606066
+#> as.factor(education)3 0.0156987 0.1707139 0.092 0.926730
+#> as.factor(education)4 -0.0425260 0.2642761 -0.161 0.872160
+#> as.factor(education)5 0.3796632 0.2203947 1.723 0.084952 .
+#> smokeintensity -0.0651561 0.0147589 -4.415 1.01e-05 ***
+#> I(smokeintensity * smokeintensity) 0.0008461 0.0002758 3.067 0.002160 **
+#> smokeyrs -0.0733708 0.0269958 -2.718 0.006571 **
+#> I(smokeyrs * smokeyrs) 0.0008384 0.0004435 1.891 0.058669 .
+#> as.factor(exercise)1 0.2914117 0.1735543 1.679 0.093136 .
+#> as.factor(exercise)2 0.3550517 0.1799293 1.973 0.048463 *
+#> as.factor(active)1 0.0108754 0.1298320 0.084 0.933243
+#> as.factor(active)2 0.0683123 0.2087269 0.327 0.743455
+#> wt71 -0.0128478 0.0222829 -0.577 0.564226
+#> I(wt71 * wt71) 0.0001209 0.0001352 0.895 0.370957
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for binomial family taken to be 1)
+#>
+#> Null deviance: 1876.3 on 1628 degrees of freedom
+#> Residual deviance: 1766.7 on 1610 degrees of freedom
+#> AIC: 1804.7
+#>
+#> Number of Fisher Scoring iterations: 4
nhefs$ps <- predict(fit3, nhefs, type="response")
+
+summary(nhefs$ps[nhefs$qsmk==0])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.05298 0.16949 0.22747 0.24504 0.30441 0.65788
summary(nhefs$ps[nhefs$qsmk==1])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 0.06248 0.22046 0.28897 0.31240 0.38122 0.79320
+# # plotting the estimated propensity score
+# install.packages("ggplot2") # install packages if necessary
+# install.packages("dplyr")
+library("ggplot2")
+library("dplyr")
+#>
+#> Attaching package: 'dplyr'
+#> The following object is masked from 'package:MASS':
+#>
+#> select
+#> The following objects are masked from 'package:stats':
+#>
+#> filter, lag
+#> The following objects are masked from 'package:base':
+#>
+#> intersect, setdiff, setequal, union
ggplot(nhefs, aes(x = ps, fill = qsmk)) + geom_density(alpha = 0.2) +
+ xlab('Probability of Quitting Smoking During Follow-up') +
+ ggtitle('Propensity Score Distribution by Treatment Group') +
+ scale_fill_discrete('') +
+ theme(legend.position = 'bottom', legend.direction = 'vertical')
+#> Warning: The following aesthetics were dropped during statistical transformation: fill.
+#> ℹ This can happen when ggplot fails to infer the correct grouping structure in
+#> the data.
+#> ℹ Did you forget to specify a `group` aesthetic or to convert a numerical
+#> variable into a factor?
-# alternative plot with histograms
-nhefs <- nhefs %>% mutate(qsmklabel = ifelse(qsmk == 1,
- yes = 'Quit Smoking 1971-1982',
- no = 'Did Not Quit Smoking 1971-1982'))
-ggplot(nhefs, aes(x = ps, fill = as.factor(qsmk), color = as.factor(qsmk))) +
- geom_histogram(alpha = 0.3, position = 'identity', bins=15) +
- facet_grid(as.factor(qsmk) ~ .) +
- xlab('Probability of Quitting Smoking During Follow-up') +
- ggtitle('Propensity Score Distribution by Treatment Group') +
- scale_fill_discrete('') +
- scale_color_discrete('') +
- theme(legend.position = 'bottom', legend.direction = 'vertical')
+# alternative plot with histograms
+nhefs <- nhefs %>% mutate(qsmklabel = ifelse(qsmk == 1,
+ yes = 'Quit Smoking 1971-1982',
+ no = 'Did Not Quit Smoking 1971-1982'))
+ggplot(nhefs, aes(x = ps, fill = as.factor(qsmk), color = as.factor(qsmk))) +
+ geom_histogram(alpha = 0.3, position = 'identity', bins=15) +
+ facet_grid(as.factor(qsmk) ~ .) +
+ xlab('Probability of Quitting Smoking During Follow-up') +
+ ggtitle('Propensity Score Distribution by Treatment Group') +
+ scale_fill_discrete('') +
+ scale_color_discrete('') +
+ theme(legend.position = 'bottom', legend.direction = 'vertical')
# attempt to reproduce plot from the book
-nhefs %>%
- mutate(ps.grp = round(ps/0.05) * 0.05) %>%
- group_by(qsmk, ps.grp) %>%
- summarize(n = n()) %>%
- ungroup() %>%
- mutate(n2 = ifelse(qsmk == 0, yes = n, no = -1*n)) %>%
- ggplot(aes(x = ps.grp, y = n2, fill = as.factor(qsmk))) +
- geom_bar(stat = 'identity', position = 'identity') +
- geom_text(aes(label = n, x = ps.grp, y = n2 + ifelse(qsmk == 0, 8, -8))) +
- xlab('Probability of Quitting Smoking During Follow-up') +
- ylab('N') +
- ggtitle('Propensity Score Distribution by Treatment Group') +
- scale_fill_discrete('') +
- scale_x_continuous(breaks = seq(0, 1, 0.05)) +
- theme(legend.position = 'bottom', legend.direction = 'vertical',
- axis.ticks.y = element_blank(),
- axis.text.y = element_blank())
# attempt to reproduce plot from the book
+nhefs %>%
+ mutate(ps.grp = round(ps/0.05) * 0.05) %>%
+ group_by(qsmk, ps.grp) %>%
+ summarize(n = n()) %>%
+ ungroup() %>%
+ mutate(n2 = ifelse(qsmk == 0, yes = n, no = -1*n)) %>%
+ ggplot(aes(x = ps.grp, y = n2, fill = as.factor(qsmk))) +
+ geom_bar(stat = 'identity', position = 'identity') +
+ geom_text(aes(label = n, x = ps.grp, y = n2 + ifelse(qsmk == 0, 8, -8))) +
+ xlab('Probability of Quitting Smoking During Follow-up') +
+ ylab('N') +
+ ggtitle('Propensity Score Distribution by Treatment Group') +
+ scale_fill_discrete('') +
+ scale_x_continuous(breaks = seq(0, 1, 0.05)) +
+ theme(legend.position = 'bottom', legend.direction = 'vertical',
+ axis.ticks.y = element_blank(),
+ axis.text.y = element_blank())
Program 15.3
@@ -668,295 +668,295 @@ Program 15.3
# calculation of deciles
-nhefs$ps.dec <- cut(nhefs$ps,
- breaks=c(quantile(nhefs$ps, probs=seq(0,1,0.1))),
- labels=seq(1:10),
- include.lowest=TRUE)
-
-#install.packages("psych") # install package if required
-library("psych")
-#>
-#> Attaching package: 'psych'
-#> The following objects are masked from 'package:ggplot2':
-#>
-#> %+%, alpha
-describeBy(nhefs$ps, list(nhefs$ps.dec, nhefs$qsmk))
-#>
-#> Descriptive statistics by group
-#> : 1
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 151 0.1 0.02 0.11 0.1 0.02 0.05 0.13 0.08 -0.55 -0.53 0
-#> ------------------------------------------------------------
-#> : 2
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 136 0.15 0.01 0.15 0.15 0.01 0.13 0.17 0.04 -0.04 -1.23 0
-#> ------------------------------------------------------------
-#> : 3
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 134 0.18 0.01 0.18 0.18 0.01 0.17 0.19 0.03 -0.08 -1.34 0
-#> ------------------------------------------------------------
-#> : 4
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 129 0.21 0.01 0.21 0.21 0.01 0.19 0.22 0.02 -0.04 -1.13 0
-#> ------------------------------------------------------------
-#> : 5
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 120 0.23 0.01 0.23 0.23 0.01 0.22 0.25 0.03 0.24 -1.22 0
-#> ------------------------------------------------------------
-#> : 6
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 117 0.26 0.01 0.26 0.26 0.01 0.25 0.27 0.03 -0.11 -1.29 0
-#> ------------------------------------------------------------
-#> : 7
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 120 0.29 0.01 0.29 0.29 0.01 0.27 0.31 0.03 -0.23 -1.19 0
-#> ------------------------------------------------------------
-#> : 8
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 112 0.33 0.01 0.33 0.33 0.02 0.31 0.35 0.04 0.15 -1.1 0
-#> ------------------------------------------------------------
-#> : 9
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 96 0.38 0.02 0.38 0.38 0.02 0.35 0.42 0.06 0.13 -1.15 0
-#> ------------------------------------------------------------
-#> : 10
-#> : 0
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 86 0.49 0.06 0.47 0.48 0.05 0.42 0.66 0.24 1.1 0.47 0.01
-#> ------------------------------------------------------------
-#> : 1
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 12 0.1 0.02 0.11 0.1 0.03 0.06 0.13 0.07 -0.5 -1.36 0.01
-#> ------------------------------------------------------------
-#> : 2
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 27 0.15 0.01 0.15 0.15 0.01 0.13 0.17 0.03 -0.03 -1.34 0
-#> ------------------------------------------------------------
-#> : 3
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 29 0.18 0.01 0.18 0.18 0.01 0.17 0.19 0.03 0.01 -1.34 0
-#> ------------------------------------------------------------
-#> : 4
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 34 0.21 0.01 0.21 0.21 0.01 0.19 0.22 0.02 -0.31 -1.23 0
-#> ------------------------------------------------------------
-#> : 5
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 43 0.23 0.01 0.23 0.23 0.01 0.22 0.25 0.03 0.11 -1.23 0
-#> ------------------------------------------------------------
-#> : 6
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 45 0.26 0.01 0.26 0.26 0.01 0.25 0.27 0.03 0.2 -1.12 0
-#> ------------------------------------------------------------
-#> : 7
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 43 0.29 0.01 0.29 0.29 0.01 0.27 0.31 0.03 0.16 -1.25 0
-#> ------------------------------------------------------------
-#> : 8
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 51 0.33 0.01 0.33 0.33 0.02 0.31 0.35 0.04 0.11 -1.19 0
-#> ------------------------------------------------------------
-#> : 9
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 67 0.38 0.02 0.38 0.38 0.03 0.35 0.42 0.06 0.19 -1.27 0
-#> ------------------------------------------------------------
-#> : 10
-#> : 1
-#> vars n mean sd median trimmed mad min max range skew kurtosis se
-#> X1 1 77 0.52 0.08 0.51 0.51 0.08 0.42 0.79 0.38 0.88 0.81 0.01
-
-# function to create deciles easily
-decile <- function(x) {
- return(factor(quantcut(x, seq(0, 1, 0.1), labels = FALSE)))
-}
-
-# regression on PS deciles, allowing for effect modification
-for (deciles in c(1:10)) {
- print(t.test(wt82_71~qsmk, data=nhefs[which(nhefs$ps.dec==deciles),]))
-}
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = 0.0060506, df = 11.571, p-value = 0.9953
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -5.283903 5.313210
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 3.995205 3.980551
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -3.1117, df = 37.365, p-value = 0.003556
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -6.849335 -1.448161
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 2.904679 7.053426
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -4.5301, df = 35.79, p-value = 6.317e-05
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -9.474961 -3.613990
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 2.612094 9.156570
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -1.4117, df = 45.444, p-value = 0.1648
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -5.6831731 0.9985715
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 3.474679 5.816979
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -3.1371, df = 74.249, p-value = 0.002446
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -6.753621 -1.507087
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 2.098800 6.229154
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -2.1677, df = 50.665, p-value = 0.0349
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -8.7516605 -0.3350127
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 1.847004 6.390340
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -3.3155, df = 84.724, p-value = 0.001348
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -6.904207 -1.727590
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 1.560048 5.875946
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -2.664, df = 75.306, p-value = 0.009441
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -6.2396014 -0.9005605
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> 0.2846851 3.8547661
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -1.9122, df = 129.12, p-value = 0.05806
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -4.68143608 0.07973698
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> -0.8954482 1.4054014
-#>
-#>
-#> Welch Two Sample t-test
-#>
-#> data: wt82_71 by qsmk
-#> t = -1.5925, df = 142.72, p-value = 0.1135
-#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
-#> 95 percent confidence interval:
-#> -5.0209284 0.5404697
-#> sample estimates:
-#> mean in group 0 mean in group 1
-#> -0.5043766 1.7358528
-
-# regression on PS deciles, not allowing for effect modification
-fit.psdec <- glm(wt82_71 ~ qsmk + as.factor(ps.dec), data = nhefs)
-summary(fit.psdec)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + as.factor(ps.dec), data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 3.7505 0.6089 6.159 9.29e-10 ***
-#> qsmk 3.5005 0.4571 7.659 3.28e-14 ***
-#> as.factor(ps.dec)2 -0.7391 0.8611 -0.858 0.3908
-#> as.factor(ps.dec)3 -0.6182 0.8612 -0.718 0.4730
-#> as.factor(ps.dec)4 -0.5204 0.8584 -0.606 0.5444
-#> as.factor(ps.dec)5 -1.4884 0.8590 -1.733 0.0834 .
-#> as.factor(ps.dec)6 -1.6227 0.8675 -1.871 0.0616 .
-#> as.factor(ps.dec)7 -1.9853 0.8681 -2.287 0.0223 *
-#> as.factor(ps.dec)8 -3.4447 0.8749 -3.937 8.61e-05 ***
-#> as.factor(ps.dec)9 -5.1544 0.8848 -5.825 6.91e-09 ***
-#> as.factor(ps.dec)10 -4.8403 0.8828 -5.483 4.87e-08 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 58.42297)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 90848 on 1555 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 10827
-#>
-#> Number of Fisher Scoring iterations: 2
-confint.lm(fit.psdec)
-#> 2.5 % 97.5 %
-#> (Intercept) 2.556098 4.94486263
-#> qsmk 2.603953 4.39700504
-#> as.factor(ps.dec)2 -2.428074 0.94982494
-#> as.factor(ps.dec)3 -2.307454 1.07103569
-#> as.factor(ps.dec)4 -2.204103 1.16333143
-#> as.factor(ps.dec)5 -3.173337 0.19657938
-#> as.factor(ps.dec)6 -3.324345 0.07893027
-#> as.factor(ps.dec)7 -3.688043 -0.28248110
-#> as.factor(ps.dec)8 -5.160862 -1.72860113
-#> as.factor(ps.dec)9 -6.889923 -3.41883853
-#> as.factor(ps.dec)10 -6.571789 -3.10873731
# calculation of deciles
+nhefs$ps.dec <- cut(nhefs$ps,
+ breaks=c(quantile(nhefs$ps, probs=seq(0,1,0.1))),
+ labels=seq(1:10),
+ include.lowest=TRUE)
+
+#install.packages("psych") # install package if required
+library("psych")
+#>
+#> Attaching package: 'psych'
+#> The following objects are masked from 'package:ggplot2':
+#>
+#> %+%, alpha
describeBy(nhefs$ps, list(nhefs$ps.dec, nhefs$qsmk))
+#>
+#> Descriptive statistics by group
+#> : 1
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 151 0.1 0.02 0.11 0.1 0.02 0.05 0.13 0.08 -0.55 -0.53 0
+#> ------------------------------------------------------------
+#> : 2
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 136 0.15 0.01 0.15 0.15 0.01 0.13 0.17 0.04 -0.04 -1.23 0
+#> ------------------------------------------------------------
+#> : 3
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 134 0.18 0.01 0.18 0.18 0.01 0.17 0.19 0.03 -0.08 -1.34 0
+#> ------------------------------------------------------------
+#> : 4
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 129 0.21 0.01 0.21 0.21 0.01 0.19 0.22 0.02 -0.04 -1.13 0
+#> ------------------------------------------------------------
+#> : 5
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 120 0.23 0.01 0.23 0.23 0.01 0.22 0.25 0.03 0.24 -1.22 0
+#> ------------------------------------------------------------
+#> : 6
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 117 0.26 0.01 0.26 0.26 0.01 0.25 0.27 0.03 -0.11 -1.29 0
+#> ------------------------------------------------------------
+#> : 7
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 120 0.29 0.01 0.29 0.29 0.01 0.27 0.31 0.03 -0.23 -1.19 0
+#> ------------------------------------------------------------
+#> : 8
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 112 0.33 0.01 0.33 0.33 0.02 0.31 0.35 0.04 0.15 -1.1 0
+#> ------------------------------------------------------------
+#> : 9
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 96 0.38 0.02 0.38 0.38 0.02 0.35 0.42 0.06 0.13 -1.15 0
+#> ------------------------------------------------------------
+#> : 10
+#> : 0
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 86 0.49 0.06 0.47 0.48 0.05 0.42 0.66 0.24 1.1 0.47 0.01
+#> ------------------------------------------------------------
+#> : 1
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 12 0.1 0.02 0.11 0.1 0.03 0.06 0.13 0.07 -0.5 -1.36 0.01
+#> ------------------------------------------------------------
+#> : 2
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 27 0.15 0.01 0.15 0.15 0.01 0.13 0.17 0.03 -0.03 -1.34 0
+#> ------------------------------------------------------------
+#> : 3
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 29 0.18 0.01 0.18 0.18 0.01 0.17 0.19 0.03 0.01 -1.34 0
+#> ------------------------------------------------------------
+#> : 4
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 34 0.21 0.01 0.21 0.21 0.01 0.19 0.22 0.02 -0.31 -1.23 0
+#> ------------------------------------------------------------
+#> : 5
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 43 0.23 0.01 0.23 0.23 0.01 0.22 0.25 0.03 0.11 -1.23 0
+#> ------------------------------------------------------------
+#> : 6
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 45 0.26 0.01 0.26 0.26 0.01 0.25 0.27 0.03 0.2 -1.12 0
+#> ------------------------------------------------------------
+#> : 7
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 43 0.29 0.01 0.29 0.29 0.01 0.27 0.31 0.03 0.16 -1.25 0
+#> ------------------------------------------------------------
+#> : 8
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 51 0.33 0.01 0.33 0.33 0.02 0.31 0.35 0.04 0.11 -1.19 0
+#> ------------------------------------------------------------
+#> : 9
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 67 0.38 0.02 0.38 0.38 0.03 0.35 0.42 0.06 0.19 -1.27 0
+#> ------------------------------------------------------------
+#> : 10
+#> : 1
+#> vars n mean sd median trimmed mad min max range skew kurtosis se
+#> X1 1 77 0.52 0.08 0.51 0.51 0.08 0.42 0.79 0.38 0.88 0.81 0.01
+# function to create deciles easily
+decile <- function(x) {
+ return(factor(quantcut(x, seq(0, 1, 0.1), labels = FALSE)))
+}
+
+# regression on PS deciles, allowing for effect modification
+for (deciles in c(1:10)) {
+ print(t.test(wt82_71~qsmk, data=nhefs[which(nhefs$ps.dec==deciles),]))
+}
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = 0.0060506, df = 11.571, p-value = 0.9953
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -5.283903 5.313210
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 3.995205 3.980551
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -3.1117, df = 37.365, p-value = 0.003556
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -6.849335 -1.448161
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 2.904679 7.053426
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -4.5301, df = 35.79, p-value = 6.317e-05
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -9.474961 -3.613990
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 2.612094 9.156570
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -1.4117, df = 45.444, p-value = 0.1648
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -5.6831731 0.9985715
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 3.474679 5.816979
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -3.1371, df = 74.249, p-value = 0.002446
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -6.753621 -1.507087
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 2.098800 6.229154
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -2.1677, df = 50.665, p-value = 0.0349
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -8.7516605 -0.3350127
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 1.847004 6.390340
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -3.3155, df = 84.724, p-value = 0.001348
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -6.904207 -1.727590
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 1.560048 5.875946
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -2.664, df = 75.306, p-value = 0.009441
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -6.2396014 -0.9005605
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> 0.2846851 3.8547661
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -1.9122, df = 129.12, p-value = 0.05806
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -4.68143608 0.07973698
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> -0.8954482 1.4054014
+#>
+#>
+#> Welch Two Sample t-test
+#>
+#> data: wt82_71 by qsmk
+#> t = -1.5925, df = 142.72, p-value = 0.1135
+#> alternative hypothesis: true difference in means between group 0 and group 1 is not equal to 0
+#> 95 percent confidence interval:
+#> -5.0209284 0.5404697
+#> sample estimates:
+#> mean in group 0 mean in group 1
+#> -0.5043766 1.7358528
+# regression on PS deciles, not allowing for effect modification
+fit.psdec <- glm(wt82_71 ~ qsmk + as.factor(ps.dec), data = nhefs)
+summary(fit.psdec)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + as.factor(ps.dec), data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 3.7505 0.6089 6.159 9.29e-10 ***
+#> qsmk 3.5005 0.4571 7.659 3.28e-14 ***
+#> as.factor(ps.dec)2 -0.7391 0.8611 -0.858 0.3908
+#> as.factor(ps.dec)3 -0.6182 0.8612 -0.718 0.4730
+#> as.factor(ps.dec)4 -0.5204 0.8584 -0.606 0.5444
+#> as.factor(ps.dec)5 -1.4884 0.8590 -1.733 0.0834 .
+#> as.factor(ps.dec)6 -1.6227 0.8675 -1.871 0.0616 .
+#> as.factor(ps.dec)7 -1.9853 0.8681 -2.287 0.0223 *
+#> as.factor(ps.dec)8 -3.4447 0.8749 -3.937 8.61e-05 ***
+#> as.factor(ps.dec)9 -5.1544 0.8848 -5.825 6.91e-09 ***
+#> as.factor(ps.dec)10 -4.8403 0.8828 -5.483 4.87e-08 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 58.42297)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 90848 on 1555 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 10827
+#>
+#> Number of Fisher Scoring iterations: 2
confint.lm(fit.psdec)
+#> 2.5 % 97.5 %
+#> (Intercept) 2.556098 4.94486263
+#> qsmk 2.603953 4.39700504
+#> as.factor(ps.dec)2 -2.428074 0.94982494
+#> as.factor(ps.dec)3 -2.307454 1.07103569
+#> as.factor(ps.dec)4 -2.204103 1.16333143
+#> as.factor(ps.dec)5 -3.173337 0.19657938
+#> as.factor(ps.dec)6 -3.324345 0.07893027
+#> as.factor(ps.dec)7 -3.688043 -0.28248110
+#> as.factor(ps.dec)8 -5.160862 -1.72860113
+#> as.factor(ps.dec)9 -6.889923 -3.41883853
+#> as.factor(ps.dec)10 -6.571789 -3.10873731
Program 15.4
@@ -964,164 +964,164 @@ Program 15.4
#install.packages("boot") # install package if required
-library("boot")
-#>
-#> Attaching package: 'boot'
-#> The following object is masked from 'package:psych':
-#>
-#> logit
-#> The following object is masked from 'package:survival':
-#>
-#> aml
-
-# standardization by propensity score, agnostic regarding effect modification
-std.ps <- function(data, indices) {
- d <- data[indices,] # 1st copy: equal to original one`
- # calculating propensity scores
- ps.fit <- glm(qsmk ~ sex + race + age + I(age*age)
- + as.factor(education) + smokeintensity
- + I(smokeintensity*smokeintensity) + smokeyrs
- + I(smokeyrs*smokeyrs) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71*wt71),
- data=d, family=binomial())
- d$pscore <- predict(ps.fit, d, type="response")
-
- # create a dataset with 3 copies of each subject
- d$interv <- -1 # 1st copy: equal to original one`
- d0 <- d # 2nd copy: treatment set to 0, outcome to missing
- d0$interv <- 0
- d0$qsmk <- 0
- d0$wt82_71 <- NA
- d1 <- d # 3rd copy: treatment set to 1, outcome to missing
- d1$interv <- 1
- d1$qsmk <- 1
- d1$wt82_71 <- NA
- d.onesample <- rbind(d, d0, d1) # combining datasets
-
- std.fit <- glm(wt82_71 ~ qsmk + pscore + I(qsmk*pscore), data=d.onesample)
- d.onesample$predicted_meanY <- predict(std.fit, d.onesample)
-
- # estimate mean outcome in each of the groups interv=-1, interv=0, and interv=1
- return(c(mean(d.onesample$predicted_meanY[d.onesample$interv==-1]),
- mean(d.onesample$predicted_meanY[d.onesample$interv==0]),
- mean(d.onesample$predicted_meanY[d.onesample$interv==1]),
- mean(d.onesample$predicted_meanY[d.onesample$interv==1])-
- mean(d.onesample$predicted_meanY[d.onesample$interv==0])))
-}
-
-# bootstrap
-results <- boot(data=nhefs, statistic=std.ps, R=5)
-
-# generating confidence intervals
-se <- c(sd(results$t[,1]), sd(results$t[,2]),
- sd(results$t[,3]), sd(results$t[,4]))
-mean <- results$t0
-ll <- mean - qnorm(0.975)*se
-ul <- mean + qnorm(0.975)*se
-
-bootstrap <- data.frame(cbind(c("Observed", "No Treatment", "Treatment",
- "Treatment - No Treatment"), mean, se, ll, ul))
-bootstrap
-#> V1 mean se ll
-#> 1 Observed 2.63384609228479 0.0827987483280176 2.47156352759688
-#> 2 No Treatment 1.71983636149845 0.161487941750904 1.40332581172918
-#> 3 Treatment 5.35072300362985 0.688985026710106 4.00033716539068
-#> 4 Treatment - No Treatment 3.6308866421314 0.822159808859099 2.01948302723123
-#> ul
-#> 1 2.7961286569727
-#> 2 2.03634691126773
-#> 3 6.70110884186903
-#> 4 5.24229025703157
# regression on the propensity score (linear term)
-model6 <- glm(wt82_71 ~ qsmk + ps, data = nhefs) # p.qsmk
-summary(model6)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + ps, data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 5.5945 0.4831 11.581 < 2e-16 ***
-#> qsmk 3.5506 0.4573 7.765 1.47e-14 ***
-#> ps -14.8218 1.7576 -8.433 < 2e-16 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 58.28455)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 91099 on 1563 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 10815
-#>
-#> Number of Fisher Scoring iterations: 2
-
-# standarization on the propensity score
-# (step 1) create two new datasets, one with all treated and one with all untreated
-treated <- nhefs
- treated$qsmk <- 1
-
-untreated <- nhefs
- untreated$qsmk <- 0
-
-# (step 2) predict values for everyone in each new dataset based on above model
-treated$pred.y <- predict(model6, treated)
-untreated$pred.y <- predict(model6, untreated)
-
-# (step 3) compare mean weight loss had all been treated vs. that had all been untreated
-mean1 <- mean(treated$pred.y, na.rm = TRUE)
-mean0 <- mean(untreated$pred.y, na.rm = TRUE)
-mean1
-#> [1] 5.250824
-mean0
-#> [1] 1.700228
-mean1 - mean0
-#> [1] 3.550596
-
-# (step 4) bootstrap a confidence interval
-# number of bootstraps
-nboot <- 100
-# set up a matrix to store results
-boots <- data.frame(i = 1:nboot,
- mean1 = NA,
- mean0 = NA,
- difference = NA)
-# loop to perform the bootstrapping
-nhefs <- subset(nhefs, !is.na(ps) & !is.na(wt82_71)) # p.qsmk
-for(i in 1:nboot) {
- # sample with replacement
- sampl <- nhefs[sample(1:nrow(nhefs), nrow(nhefs), replace = TRUE), ]
-
- # fit the model in the bootstrap sample
- bootmod <- glm(wt82_71 ~ qsmk + ps, data = sampl) # ps
-
- # create new datasets
- sampl.treated <- sampl %>%
- mutate(qsmk = 1)
-
- sampl.untreated <- sampl %>%
- mutate(qsmk = 0)
-
- # predict values
- sampl.treated$pred.y <- predict(bootmod, sampl.treated)
- sampl.untreated$pred.y <- predict(bootmod, sampl.untreated)
-
- # output results
- boots[i, 'mean1'] <- mean(sampl.treated$pred.y, na.rm = TRUE)
- boots[i, 'mean0'] <- mean(sampl.untreated$pred.y, na.rm = TRUE)
- boots[i, 'difference'] <- boots[i, 'mean1'] - boots[i, 'mean0']
-
- # once loop is done, print the results
- if(i == nboot) {
- cat('95% CI for the causal mean difference\n')
- cat(mean(boots$difference) - 1.96*sd(boots$difference),
- ',',
- mean(boots$difference) + 1.96*sd(boots$difference))
- }
-}
-#> 95% CI for the causal mean difference
-#> 2.723492 , 4.527558
#install.packages("boot") # install package if required
+library("boot")
+#>
+#> Attaching package: 'boot'
+#> The following object is masked from 'package:psych':
+#>
+#> logit
+#> The following object is masked from 'package:survival':
+#>
+#> aml
+# standardization by propensity score, agnostic regarding effect modification
+std.ps <- function(data, indices) {
+ d <- data[indices,] # 1st copy: equal to original one`
+ # calculating propensity scores
+ ps.fit <- glm(qsmk ~ sex + race + age + I(age*age)
+ + as.factor(education) + smokeintensity
+ + I(smokeintensity*smokeintensity) + smokeyrs
+ + I(smokeyrs*smokeyrs) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71*wt71),
+ data=d, family=binomial())
+ d$pscore <- predict(ps.fit, d, type="response")
+
+ # create a dataset with 3 copies of each subject
+ d$interv <- -1 # 1st copy: equal to original one`
+ d0 <- d # 2nd copy: treatment set to 0, outcome to missing
+ d0$interv <- 0
+ d0$qsmk <- 0
+ d0$wt82_71 <- NA
+ d1 <- d # 3rd copy: treatment set to 1, outcome to missing
+ d1$interv <- 1
+ d1$qsmk <- 1
+ d1$wt82_71 <- NA
+ d.onesample <- rbind(d, d0, d1) # combining datasets
+
+ std.fit <- glm(wt82_71 ~ qsmk + pscore + I(qsmk*pscore), data=d.onesample)
+ d.onesample$predicted_meanY <- predict(std.fit, d.onesample)
+
+ # estimate mean outcome in each of the groups interv=-1, interv=0, and interv=1
+ return(c(mean(d.onesample$predicted_meanY[d.onesample$interv==-1]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv==0]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv==1]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv==1])-
+ mean(d.onesample$predicted_meanY[d.onesample$interv==0])))
+}
+
+# bootstrap
+results <- boot(data=nhefs, statistic=std.ps, R=5)
+
+# generating confidence intervals
+se <- c(sd(results$t[,1]), sd(results$t[,2]),
+ sd(results$t[,3]), sd(results$t[,4]))
+mean <- results$t0
+ll <- mean - qnorm(0.975)*se
+ul <- mean + qnorm(0.975)*se
+
+bootstrap <- data.frame(cbind(c("Observed", "No Treatment", "Treatment",
+ "Treatment - No Treatment"), mean, se, ll, ul))
+bootstrap
+#> V1 mean se ll
+#> 1 Observed 2.63384609228479 0.257431993398983 2.12928865675443
+#> 2 No Treatment 1.71983636149845 0.231785902506788 1.26554434046104
+#> 3 Treatment 5.35072300362985 0.248611665961784 4.86345309220825
+#> 4 Treatment - No Treatment 3.6308866421314 0.284117716001535 3.07402615139861
+#> ul
+#> 1 3.13840352781515
+#> 2 2.17412838253587
+#> 3 5.83799291505145
+#> 4 4.18774713286419
# regression on the propensity score (linear term)
+model6 <- glm(wt82_71 ~ qsmk + ps, data = nhefs) # p.qsmk
+summary(model6)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + ps, data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 5.5945 0.4831 11.581 < 2e-16 ***
+#> qsmk 3.5506 0.4573 7.765 1.47e-14 ***
+#> ps -14.8218 1.7576 -8.433 < 2e-16 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 58.28455)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 91099 on 1563 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 10815
+#>
+#> Number of Fisher Scoring iterations: 2
+# standarization on the propensity score
+# (step 1) create two new datasets, one with all treated and one with all untreated
+treated <- nhefs
+ treated$qsmk <- 1
+
+untreated <- nhefs
+ untreated$qsmk <- 0
+
+# (step 2) predict values for everyone in each new dataset based on above model
+treated$pred.y <- predict(model6, treated)
+untreated$pred.y <- predict(model6, untreated)
+
+# (step 3) compare mean weight loss had all been treated vs. that had all been untreated
+mean1 <- mean(treated$pred.y, na.rm = TRUE)
+mean0 <- mean(untreated$pred.y, na.rm = TRUE)
+mean1
+#> [1] 5.250824
+# (step 4) bootstrap a confidence interval
+# number of bootstraps
+nboot <- 100
+# set up a matrix to store results
+boots <- data.frame(i = 1:nboot,
+ mean1 = NA,
+ mean0 = NA,
+ difference = NA)
+# loop to perform the bootstrapping
+nhefs <- subset(nhefs, !is.na(ps) & !is.na(wt82_71)) # p.qsmk
+for(i in 1:nboot) {
+ # sample with replacement
+ sampl <- nhefs[sample(1:nrow(nhefs), nrow(nhefs), replace = TRUE), ]
+
+ # fit the model in the bootstrap sample
+ bootmod <- glm(wt82_71 ~ qsmk + ps, data = sampl) # ps
+
+ # create new datasets
+ sampl.treated <- sampl %>%
+ mutate(qsmk = 1)
+
+ sampl.untreated <- sampl %>%
+ mutate(qsmk = 0)
+
+ # predict values
+ sampl.treated$pred.y <- predict(bootmod, sampl.treated)
+ sampl.untreated$pred.y <- predict(bootmod, sampl.untreated)
+
+ # output results
+ boots[i, 'mean1'] <- mean(sampl.treated$pred.y, na.rm = TRUE)
+ boots[i, 'mean0'] <- mean(sampl.untreated$pred.y, na.rm = TRUE)
+ boots[i, 'difference'] <- boots[i, 'mean1'] - boots[i, 'mean0']
+
+ # once loop is done, print the results
+ if(i == nboot) {
+ cat('95% CI for the causal mean difference\n')
+ cat(mean(boots$difference) - 1.96*sd(boots$difference),
+ ',',
+ mean(boots$difference) + 1.96*sd(boots$difference))
+ }
+}
+#> 95% CI for the causal mean difference
+#> 2.585806 , 4.616634
Session information: R
# install.packages("sessioninfo")
-sessioninfo::session_info()
-#> ─ Session info ───────────────────────────────────────────────────────────────
-#> setting value
-#> version R version 4.4.0 (2024-04-24)
-#> os macOS Sonoma 14.4.1
-#> system aarch64, darwin20
-#> ui X11
-#> language (EN)
-#> collate en_US.UTF-8
-#> ctype en_US.UTF-8
-#> tz Europe/London
-#> date 2024-04-25
-#> pandoc 3.1.13 @ /opt/homebrew/bin/ (via rmarkdown)
-#>
-#> ─ Packages ───────────────────────────────────────────────────────────────────
-#> package * version date (UTC) lib source
-#> bookdown 0.39 2024-04-15 [1] CRAN (R 4.4.0)
-#> bslib 0.7.0 2024-03-29 [1] CRAN (R 4.4.0)
-#> cachem 1.0.8 2023-05-01 [1] CRAN (R 4.4.0)
-#> cli 3.6.2 2023-12-11 [1] CRAN (R 4.4.0)
-#> digest 0.6.35 2024-03-11 [1] CRAN (R 4.4.0)
-#> evaluate 0.23 2023-11-01 [1] CRAN (R 4.4.0)
-#> fastmap 1.1.1 2023-02-24 [1] CRAN (R 4.4.0)
-#> htmltools 0.5.8.1 2024-04-04 [1] CRAN (R 4.4.0)
-#> jquerylib 0.1.4 2021-04-26 [1] CRAN (R 4.4.0)
-#> jsonlite 1.8.8 2023-12-04 [1] CRAN (R 4.4.0)
-#> knitr 1.46 2024-04-06 [1] CRAN (R 4.4.0)
-#> lifecycle 1.0.4 2023-11-07 [1] CRAN (R 4.4.0)
-#> R6 2.5.1 2021-08-19 [1] CRAN (R 4.4.0)
-#> rlang 1.1.3 2024-01-10 [1] CRAN (R 4.4.0)
-#> rmarkdown 2.26 2024-03-05 [1] CRAN (R 4.4.0)
-#> rstudioapi 0.16.0 2024-03-24 [1] CRAN (R 4.4.0)
-#> sass 0.4.9 2024-03-15 [1] CRAN (R 4.4.0)
-#> sessioninfo 1.2.2 2021-12-06 [1] CRAN (R 4.4.0)
-#> xfun 0.43 2024-03-25 [1] CRAN (R 4.4.0)
-#> yaml 2.3.8 2023-12-11 [1] CRAN (R 4.4.0)
-#>
-#> [1] /Library/Frameworks/R.framework/Versions/4.4-arm64/Resources/library
-#>
-#> ──────────────────────────────────────────────────────────────────────────────
# install.packages("sessioninfo")
+sessioninfo::session_info()
+#> ─ Session info ───────────────────────────────────────────────────────────────
+#> setting value
+#> version R version 4.4.1 (2024-06-14)
+#> os macOS Sonoma 14.5
+#> system aarch64, darwin20
+#> ui X11
+#> language (EN)
+#> collate en_US.UTF-8
+#> ctype en_US.UTF-8
+#> tz Europe/London
+#> date 2024-06-16
+#> pandoc 3.2 @ /opt/homebrew/bin/ (via rmarkdown)
+#>
+#> ─ Packages ───────────────────────────────────────────────────────────────────
+#> package * version date (UTC) lib source
+#> bookdown 0.39 2024-04-15 [1] CRAN (R 4.4.0)
+#> bslib 0.7.0 2024-03-29 [1] CRAN (R 4.4.0)
+#> cachem 1.1.0 2024-05-16 [1] CRAN (R 4.4.0)
+#> cli 3.6.2 2023-12-11 [1] CRAN (R 4.4.0)
+#> digest 0.6.35 2024-03-11 [1] CRAN (R 4.4.0)
+#> evaluate 0.24.0 2024-06-10 [1] CRAN (R 4.4.0)
+#> fastmap 1.2.0 2024-05-15 [1] CRAN (R 4.4.0)
+#> htmltools 0.5.8.1 2024-04-04 [1] CRAN (R 4.4.0)
+#> jquerylib 0.1.4 2021-04-26 [1] CRAN (R 4.4.0)
+#> jsonlite 1.8.8 2023-12-04 [1] CRAN (R 4.4.0)
+#> knitr 1.47 2024-05-29 [1] CRAN (R 4.4.0)
+#> lifecycle 1.0.4 2023-11-07 [1] CRAN (R 4.4.0)
+#> R6 2.5.1 2021-08-19 [1] CRAN (R 4.4.0)
+#> rlang 1.1.4 2024-06-04 [1] CRAN (R 4.4.0)
+#> rmarkdown 2.27 2024-05-17 [1] CRAN (R 4.4.0)
+#> rstudioapi 0.16.0 2024-03-24 [1] CRAN (R 4.4.0)
+#> sass 0.4.9 2024-03-15 [1] CRAN (R 4.4.0)
+#> sessioninfo 1.2.2 2021-12-06 [1] CRAN (R 4.4.0)
+#> xfun 0.44 2024-05-15 [1] CRAN (R 4.4.0)
+#> yaml 2.3.8 2023-12-11 [1] CRAN (R 4.4.0)
+#>
+#> [1] /Library/Frameworks/R.framework/Versions/4.4-arm64/Resources/library
+#>
+#> ──────────────────────────────────────────────────────────────────────────────
Session information: Stata
-
+
Stata/MP 18.0 for Mac (Apple Silicon)
-Revision 04 Apr 2024
+
+
-StataNow/MP 18.5 for Mac (Apple Silicon)
+Revision 22 May 2024
Copyright 1985-2023 StataCorp LLC
-Total physical memory: 18.00 GB
+Total physical memory: 8.01 GB
Stata license: Unlimited-user 2-core network, expiring 29 Jan 2025
Serial number: 501809305331
Licensed to: Tom Palmer
University of Bristol
# install.packages("sessioninfo")
-sessioninfo::session_info()
-#> ─ Session info ───────────────────────────────────────────────────────────────
-#> setting value
-#> version R version 4.4.0 (2024-04-24)
-#> os macOS Sonoma 14.4.1
-#> system aarch64, darwin20
-#> ui X11
-#> language (EN)
-#> collate en_US.UTF-8
-#> ctype en_US.UTF-8
-#> tz Europe/London
-#> date 2024-04-25
-#> pandoc 3.1.13 @ /opt/homebrew/bin/ (via rmarkdown)
-#>
-#> ─ Packages ───────────────────────────────────────────────────────────────────
-#> package * version date (UTC) lib source
-#> bookdown 0.39 2024-04-15 [1] CRAN (R 4.4.0)
-#> bslib 0.7.0 2024-03-29 [1] CRAN (R 4.4.0)
-#> cachem 1.0.8 2023-05-01 [1] CRAN (R 4.4.0)
-#> cli 3.6.2 2023-12-11 [1] CRAN (R 4.4.0)
-#> digest 0.6.35 2024-03-11 [1] CRAN (R 4.4.0)
-#> evaluate 0.23 2023-11-01 [1] CRAN (R 4.4.0)
-#> fastmap 1.1.1 2023-02-24 [1] CRAN (R 4.4.0)
-#> htmltools 0.5.8.1 2024-04-04 [1] CRAN (R 4.4.0)
-#> jquerylib 0.1.4 2021-04-26 [1] CRAN (R 4.4.0)
-#> jsonlite 1.8.8 2023-12-04 [1] CRAN (R 4.4.0)
-#> knitr 1.46 2024-04-06 [1] CRAN (R 4.4.0)
-#> lifecycle 1.0.4 2023-11-07 [1] CRAN (R 4.4.0)
-#> R6 2.5.1 2021-08-19 [1] CRAN (R 4.4.0)
-#> rlang 1.1.3 2024-01-10 [1] CRAN (R 4.4.0)
-#> rmarkdown 2.26 2024-03-05 [1] CRAN (R 4.4.0)
-#> rstudioapi 0.16.0 2024-03-24 [1] CRAN (R 4.4.0)
-#> sass 0.4.9 2024-03-15 [1] CRAN (R 4.4.0)
-#> sessioninfo 1.2.2 2021-12-06 [1] CRAN (R 4.4.0)
-#> Statamarkdown * 0.9.2 2023-12-04 [1] CRAN (R 4.4.0)
-#> xfun 0.43 2024-03-25 [1] CRAN (R 4.4.0)
-#> yaml 2.3.8 2023-12-11 [1] CRAN (R 4.4.0)
-#>
-#> [1] /Library/Frameworks/R.framework/Versions/4.4-arm64/Resources/library
-#>
-#> ──────────────────────────────────────────────────────────────────────────────
# install.packages("sessioninfo")
+sessioninfo::session_info()
+#> ─ Session info ───────────────────────────────────────────────────────────────
+#> setting value
+#> version R version 4.4.1 (2024-06-14)
+#> os macOS Sonoma 14.5
+#> system aarch64, darwin20
+#> ui X11
+#> language (EN)
+#> collate en_US.UTF-8
+#> ctype en_US.UTF-8
+#> tz Europe/London
+#> date 2024-06-16
+#> pandoc 3.2 @ /opt/homebrew/bin/ (via rmarkdown)
+#>
+#> ─ Packages ───────────────────────────────────────────────────────────────────
+#> package * version date (UTC) lib source
+#> bookdown 0.39 2024-04-15 [1] CRAN (R 4.4.0)
+#> bslib 0.7.0 2024-03-29 [1] CRAN (R 4.4.0)
+#> cachem 1.1.0 2024-05-16 [1] CRAN (R 4.4.0)
+#> cli 3.6.2 2023-12-11 [1] CRAN (R 4.4.0)
+#> digest 0.6.35 2024-03-11 [1] CRAN (R 4.4.0)
+#> evaluate 0.24.0 2024-06-10 [1] CRAN (R 4.4.0)
+#> fastmap 1.2.0 2024-05-15 [1] CRAN (R 4.4.0)
+#> htmltools 0.5.8.1 2024-04-04 [1] CRAN (R 4.4.0)
+#> jquerylib 0.1.4 2021-04-26 [1] CRAN (R 4.4.0)
+#> jsonlite 1.8.8 2023-12-04 [1] CRAN (R 4.4.0)
+#> knitr 1.47 2024-05-29 [1] CRAN (R 4.4.0)
+#> lifecycle 1.0.4 2023-11-07 [1] CRAN (R 4.4.0)
+#> R6 2.5.1 2021-08-19 [1] CRAN (R 4.4.0)
+#> rlang 1.1.4 2024-06-04 [1] CRAN (R 4.4.0)
+#> rmarkdown 2.27 2024-05-17 [1] CRAN (R 4.4.0)
+#> rstudioapi 0.16.0 2024-03-24 [1] CRAN (R 4.4.0)
+#> sass 0.4.9 2024-03-15 [1] CRAN (R 4.4.0)
+#> sessioninfo 1.2.2 2021-12-06 [1] CRAN (R 4.4.0)
+#> Statamarkdown * 0.9.2 2023-12-04 [1] CRAN (R 4.4.0)
+#> xfun 0.44 2024-05-15 [1] CRAN (R 4.4.0)
+#> yaml 2.3.8 2023-12-11 [1] CRAN (R 4.4.0)
+#>
+#> [1] /Library/Frameworks/R.framework/Versions/4.4-arm64/Resources/library
+#>
+#> ──────────────────────────────────────────────────────────────────────────────
13. Standardization and the parametric G-formula: Stata
-
+
/***************************************************************
Stata code for Causal Inference: What If by Miguel Hernan & Jamie Robins
Date: 10/10/2019
@@ -323,22 +323,22 @@
Program 13.1
use ./data/nhefs-formatted, clear
-
-/* Estimate the the conditional mean outcome within strata of quitting
-smoking and covariates, among the uncensored */
-glm wt82_71 qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71 ///
- qsmk##c.smokeintensity
-predict meanY
-summarize meanY
-
-/*Look at the predicted value for subject ID = 24770*/
-list meanY if seqn == 24770
-
-/*Observed mean outcome for comparison */
-summarize wt82_71
use ./data/nhefs-formatted, clear
+
+/* Estimate the the conditional mean outcome within strata of quitting
+smoking and covariates, among the uncensored */
+glm wt82_71 qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71 ///
+ qsmk##c.smokeintensity
+predict meanY
+summarize meanY
+
+/*Look at the predicted value for subject ID = 24770*/
+list meanY if seqn == 24770
+
+/*Observed mean outcome for comparison */
+summarize wt82_71
note: 1.qsmk omitted because of collinearity.
note: smokeintensity omitted because of collinearity.
@@ -429,107 +429,107 @@
Program 13.2
clear
-input str10 ID L A Y
-"Rheia" 0 0 0
-"Kronos" 0 0 1
-"Demeter" 0 0 0
-"Hades" 0 0 0
-"Hestia" 0 1 0
-"Poseidon" 0 1 0
-"Hera" 0 1 0
-"Zeus" 0 1 1
-"Artemis" 1 0 1
-"Apollo" 1 0 1
-"Leto" 1 0 0
-"Ares" 1 1 1
-"Athena" 1 1 1
-"Hephaestus" 1 1 1
-"Aphrodite" 1 1 1
-"Cyclope" 1 1 1
-"Persephone" 1 1 1
-"Hermes" 1 1 0
-"Hebe" 1 1 0
-"Dionysus" 1 1 0
-end
-
-/* i. Data set up for standardization:
- - create 3 copies of each subject first,
- - duplicate the dataset and create a variable `interv` which indicates
-which copy is the duplicate (interv =1) */
-expand 2, generate(interv)
-
-/* Next, duplicate the original copy (interv = 0) again, and create
-another variable 'interv2' to indicate the copy */
-expand 2 if interv == 0, generate(interv2)
-
-/* Now, change the value of 'interv' to -1 in one of the copies so that
-there are unique values of interv for each copy */
-replace interv = -1 if interv2 ==1
-drop interv2
-
-/* Check that the data has the structure you want:
- - there should be 1566 people in each of the 3 levels of interv*/
-tab interv
-
-/* Two of the copies will be for computing the standardized result
-for these two copies (interv = 0 and interv = 1), set the outcome to
-missing and force qsmk to either 0 or 1, respectively.
-You may need to edit this part of the code for your outcome and exposure variables */
-replace Y = . if interv != -1
-replace A = 0 if interv == 0
-replace A = 1 if interv == 1
-
-/* Check that the data has the structure you want:
-for interv = -1, some people quit and some do not;
-for interv = 0 or 1, noone quits or everyone quits, respectively */
-by interv, sort: summarize A
-
-*ii.Estimation in original sample*
-*Now, we do a parametric regression with the covariates we want to adjust for*
-*You may need to edit this part of the code for the variables you want.*
-*Because the copies have missing Y, this will only run the regression in the
-*original copy.*
-*The double hash between A & L creates a regression model with A and L and a
-* product term between A and L*
-regress Y A##L
-
-*Ask Stata for expected values - Stata will give you expected values for all
-* copies, not just the original ones*
-predict predY, xb
-
-*Now ask for a summary of these values by intervention*
-*These are the standardized outcome estimates: you can subtract them to get the
-* standardized difference*
-by interv, sort: summarize predY
-
-*iii.OPTIONAL: Output standardized point estimates and difference*
-*The summary from the last command gives you the standardized estimates*
-*We can stop there, or we can ask Stata to calculate the standardized difference
-* and display all the results in a simple table*
-*The code below can be used as-is without changing any variable names*
-*The option "quietly" asks Stata not to display the output of some intermediate
-* calculations*
-*You can delete this option if you want to see what is happening step-by-step*
-quietly summarize predY if(interv == -1)
-matrix input observe = (-1,`r(mean)')
-quietly summarize predY if(interv == 0)
-matrix observe = (observe \0,`r(mean)')
-quietly summarize predY if(interv == 1)
-matrix observe = (observe \1,`r(mean)')
-matrix observe = (observe \., observe[3,2]-observe[2,2])
-
-*Add some row/column descriptions and print results to screen*
-matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
-matrix colnames observe = interv value
-matrix list observe
-
-*to interpret these results:*
-*row 1, column 2, is the observed mean outcome value in our original sample*
-*row 2, column 2, is the mean outcome value if everyone had not quit smoking*
-*row 3, column 2, is the mean outcome value if everyone had quit smoking*
-*row 4, column 2, is the mean difference outcome value if everyone had quit
-* smoking compared to if everyone had not quit smoking*
clear
+input str10 ID L A Y
+"Rheia" 0 0 0
+"Kronos" 0 0 1
+"Demeter" 0 0 0
+"Hades" 0 0 0
+"Hestia" 0 1 0
+"Poseidon" 0 1 0
+"Hera" 0 1 0
+"Zeus" 0 1 1
+"Artemis" 1 0 1
+"Apollo" 1 0 1
+"Leto" 1 0 0
+"Ares" 1 1 1
+"Athena" 1 1 1
+"Hephaestus" 1 1 1
+"Aphrodite" 1 1 1
+"Cyclope" 1 1 1
+"Persephone" 1 1 1
+"Hermes" 1 1 0
+"Hebe" 1 1 0
+"Dionysus" 1 1 0
+end
+
+/* i. Data set up for standardization:
+ - create 3 copies of each subject first,
+ - duplicate the dataset and create a variable `interv` which indicates
+which copy is the duplicate (interv =1) */
+expand 2, generate(interv)
+
+/* Next, duplicate the original copy (interv = 0) again, and create
+another variable 'interv2' to indicate the copy */
+expand 2 if interv == 0, generate(interv2)
+
+/* Now, change the value of 'interv' to -1 in one of the copies so that
+there are unique values of interv for each copy */
+replace interv = -1 if interv2 ==1
+drop interv2
+
+/* Check that the data has the structure you want:
+ - there should be 1566 people in each of the 3 levels of interv*/
+tab interv
+
+/* Two of the copies will be for computing the standardized result
+for these two copies (interv = 0 and interv = 1), set the outcome to
+missing and force qsmk to either 0 or 1, respectively.
+You may need to edit this part of the code for your outcome and exposure variables */
+replace Y = . if interv != -1
+replace A = 0 if interv == 0
+replace A = 1 if interv == 1
+
+/* Check that the data has the structure you want:
+for interv = -1, some people quit and some do not;
+for interv = 0 or 1, noone quits or everyone quits, respectively */
+by interv, sort: summarize A
+
+*ii.Estimation in original sample*
+*Now, we do a parametric regression with the covariates we want to adjust for*
+*You may need to edit this part of the code for the variables you want.*
+*Because the copies have missing Y, this will only run the regression in the
+*original copy.*
+*The double hash between A & L creates a regression model with A and L and a
+* product term between A and L*
+regress Y A##L
+
+*Ask Stata for expected values - Stata will give you expected values for all
+* copies, not just the original ones*
+predict predY, xb
+
+*Now ask for a summary of these values by intervention*
+*These are the standardized outcome estimates: you can subtract them to get the
+* standardized difference*
+by interv, sort: summarize predY
+
+*iii.OPTIONAL: Output standardized point estimates and difference*
+*The summary from the last command gives you the standardized estimates*
+*We can stop there, or we can ask Stata to calculate the standardized difference
+* and display all the results in a simple table*
+*The code below can be used as-is without changing any variable names*
+*The option "quietly" asks Stata not to display the output of some intermediate
+* calculations*
+*You can delete this option if you want to see what is happening step-by-step*
+quietly summarize predY if(interv == -1)
+matrix input observe = (-1,`r(mean)')
+quietly summarize predY if(interv == 0)
+matrix observe = (observe \0,`r(mean)')
+quietly summarize predY if(interv == 1)
+matrix observe = (observe \1,`r(mean)')
+matrix observe = (observe \., observe[3,2]-observe[2,2])
+
+*Add some row/column descriptions and print results to screen*
+matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
+matrix colnames observe = interv value
+matrix list observe
+
+*to interpret these results:*
+*row 1, column 2, is the observed mean outcome value in our original sample*
+*row 2, column 2, is the mean outcome value if everyone had not quit smoking*
+*row 3, column 2, is the mean outcome value if everyone had quit smoking*
+*row 4, column 2, is the mean difference outcome value if everyone had quit
+* smoking compared to if everyone had not quit smoking*
ID L A Y
1. "Rheia" 0 0 0
2. "Kronos" 0 0 1
@@ -665,101 +665,101 @@
Program 13.3
use ./data/nhefs-formatted, clear
-
-*i.Data set up for standardization: create 3 copies of each subject*
-*first, duplicate the dataset and create a variable 'interv' which indicates
-* which copy is the duplicate (interv =1)
-expand 2, generate(interv)
-
-*next, duplicate the original copy (interv = 0) again, and create another
-* variable 'interv2' to indicate the copy
-expand 2 if interv == 0, generate(interv2)
-
-*now, change the value of 'interv' to -1 in one of the copies so that there are
-* unique values of interv for each copy*
-replace interv = -1 if interv2 ==1
-drop interv2
-
-*check that the data has the structure you want: there should be 1566 people in
-* each of the 3 levels of interv*
-tab interv
-
-*two of the copies will be for computing the standardized result*
-*for these two copies (interv = 0 and interv = 1), set the outcome to missing
-* and force qsmk to either 0 or 1, respectively*
-*you may need to edit this part of the code for your outcome and exposure variables*
-replace wt82_71 = . if interv != -1
-replace qsmk = 0 if interv == 0
-replace qsmk = 1 if interv == 1
-
-*check that the data has the structure you want: for interv = -1, some people
-* quit and some do not; for interv = 0 or 1, noone quits or everyone quits, respectively*
-by interv, sort: summarize qsmk
-
-*ii.Estimation in original sample*
-*Now, we do a parametric regression with the covariates we want to adjust for*
-*You may need to edit this part of the code for the variables you want.*
-*Because the copies have missing wt82_71, this will only run the regression in
-* the original copy*
-regress wt82_71 qsmk sex race c.age##c.age ib(last).education ///
-c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
-ib(last).exercise ib(last).active c.wt71##c.wt71 qsmk#c.smokeintensity
-
-*Ask Stata for expected values - Stata will give you expected values for all
-* copies, not just the original ones*
-predict predY, xb
-
-*Now ask for a summary of these values by intervention*
-*These are the standardized outcome estimates: you can subtract them to get the
-* standardized difference*
-by interv, sort: summarize predY
-
-/* iii.OPTIONAL: Output standardized point estimates and difference
-- The summary from the last command gives you the
-standardized estimates
-- We can stop there, or we can ask Stata to calculate the
-standardized difference and display all the results
-in a simple table
-- The code below can be used as-is without changing any
-variable names
-- The option `quietly` asks Stata not to display the output of
-some intermediate calculations
-- You can delete this option if you want to see what is
-happening step-by-step */
-quietly summarize predY if(interv == -1)
-matrix input observe = (-1,`r(mean)')
-quietly summarize predY if(interv == 0)
-matrix observe = (observe \0,`r(mean)')
-quietly summarize predY if(interv == 1)
-matrix observe = (observe \1,`r(mean)')
-matrix observe = (observe \., observe[3,2]-observe[2,2])
-
-* Add some row/column descriptions and print results to screen
-matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
-matrix colnames observe = interv value
-matrix list observe
-
-/* To interpret these results:
-- row 1, column 2, is the observed mean outcome value
-in our original sample
-- row 2, column 2, is the mean outcome value
-if everyone had not quit smoking
-- row 3, column 2, is the mean outcome value
-if everyone had quit smoking
-- row 4, column 2, is the mean difference outcome value
-if everyone had quit smoking compared to if everyone
-had not quit smoking */
-
-/* Addition due to way Statamarkdown works
-i.e. each code chunk is a separate Stata session */
-mata observe = st_matrix("observe")
-mata mata matsave ./data/observe observe, replace
-
-*drop the copies*
-drop if interv != -1
-gen meanY_b =.
-qui save ./data/nhefs_std, replace
use ./data/nhefs-formatted, clear
+
+*i.Data set up for standardization: create 3 copies of each subject*
+*first, duplicate the dataset and create a variable 'interv' which indicates
+* which copy is the duplicate (interv =1)
+expand 2, generate(interv)
+
+*next, duplicate the original copy (interv = 0) again, and create another
+* variable 'interv2' to indicate the copy
+expand 2 if interv == 0, generate(interv2)
+
+*now, change the value of 'interv' to -1 in one of the copies so that there are
+* unique values of interv for each copy*
+replace interv = -1 if interv2 ==1
+drop interv2
+
+*check that the data has the structure you want: there should be 1566 people in
+* each of the 3 levels of interv*
+tab interv
+
+*two of the copies will be for computing the standardized result*
+*for these two copies (interv = 0 and interv = 1), set the outcome to missing
+* and force qsmk to either 0 or 1, respectively*
+*you may need to edit this part of the code for your outcome and exposure variables*
+replace wt82_71 = . if interv != -1
+replace qsmk = 0 if interv == 0
+replace qsmk = 1 if interv == 1
+
+*check that the data has the structure you want: for interv = -1, some people
+* quit and some do not; for interv = 0 or 1, noone quits or everyone quits, respectively*
+by interv, sort: summarize qsmk
+
+*ii.Estimation in original sample*
+*Now, we do a parametric regression with the covariates we want to adjust for*
+*You may need to edit this part of the code for the variables you want.*
+*Because the copies have missing wt82_71, this will only run the regression in
+* the original copy*
+regress wt82_71 qsmk sex race c.age##c.age ib(last).education ///
+c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ib(last).exercise ib(last).active c.wt71##c.wt71 qsmk#c.smokeintensity
+
+*Ask Stata for expected values - Stata will give you expected values for all
+* copies, not just the original ones*
+predict predY, xb
+
+*Now ask for a summary of these values by intervention*
+*These are the standardized outcome estimates: you can subtract them to get the
+* standardized difference*
+by interv, sort: summarize predY
+
+/* iii.OPTIONAL: Output standardized point estimates and difference
+- The summary from the last command gives you the
+standardized estimates
+- We can stop there, or we can ask Stata to calculate the
+standardized difference and display all the results
+in a simple table
+- The code below can be used as-is without changing any
+variable names
+- The option `quietly` asks Stata not to display the output of
+some intermediate calculations
+- You can delete this option if you want to see what is
+happening step-by-step */
+quietly summarize predY if(interv == -1)
+matrix input observe = (-1,`r(mean)')
+quietly summarize predY if(interv == 0)
+matrix observe = (observe \0,`r(mean)')
+quietly summarize predY if(interv == 1)
+matrix observe = (observe \1,`r(mean)')
+matrix observe = (observe \., observe[3,2]-observe[2,2])
+
+* Add some row/column descriptions and print results to screen
+matrix rownames observe = observed E(Y(a=0)) E(Y(a=1)) difference
+matrix colnames observe = interv value
+matrix list observe
+
+/* To interpret these results:
+- row 1, column 2, is the observed mean outcome value
+in our original sample
+- row 2, column 2, is the mean outcome value
+if everyone had not quit smoking
+- row 3, column 2, is the mean outcome value
+if everyone had quit smoking
+- row 4, column 2, is the mean difference outcome value
+if everyone had quit smoking compared to if everyone
+had not quit smoking */
+
+/* Addition due to way Statamarkdown works
+i.e. each code chunk is a separate Stata session */
+mata observe = st_matrix("observe")
+mata mata matsave ./data/observe observe, replace
+
+*drop the copies*
+drop if interv != -1
+gen meanY_b =.
+qui save ./data/nhefs_std, replace
(1,566 observations created)
(1,566 observations created)
@@ -912,83 +912,83 @@
Program 13.4
*Run program 13.3 to obtain point estimates, and then the code below*
-
-capture program drop bootstdz
-
-program define bootstdz, rclass
-use ./data/nhefs_std, clear
-
-preserve
-
-* Draw bootstrap sample from original observations
-bsample
-
-/* Create copies with each value of qsmk in bootstrap sample.
-First, duplicate the dataset and create a variable `interv` which
-indicates which copy is the duplicate (interv =1)*/
-expand 2, generate(interv_b)
-
-/* Next, duplicate the original copy (interv = 0) again, and create
-another variable `interv2` to indicate the copy*/
-expand 2 if interv_b == 0, generate(interv2_b)
-
-/* Now, change the value of interv to -1 in one of the copies so that
-there are unique values of interv for each copy*/
-replace interv_b = -1 if interv2_b ==1
-drop interv2_b
-
-/* Two of the copies will be for computing the standardized result.
-For these two copies (interv = 0 and interv = 1), set the outcome to
-missing and force qsmk to either 0 or 1, respectively*/
-replace wt82_71 = . if interv_b != -1
-replace qsmk = 0 if interv_b == 0
-replace qsmk = 1 if interv_b == 1
-
-* Run regression
-regress wt82_71 qsmk sex race c.age##c.age ib(last).education ///
- c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
- ib(last).exercise ib(last).active c.wt71##c.wt71 ///
- qsmk#c.smokeintensity
-
-/* Ask Stata for expected values.
-Stata will give you expected values for all copies, not just the
-original ones*/
-predict predY_b, xb
-summarize predY_b if interv_b == 0
-return scalar boot_0 = r(mean)
-summarize predY_b if interv_b == 1
-return scalar boot_1 = r(mean)
-return scalar boot_diff = return(boot_1) - return(boot_0)
-drop meanY_b
-
-restore
-
-end
-
-/* Then we use the `simulate` command to run the bootstraps as many
-times as we want.
-Start with reps(10) to make sure your code runs, and then change to
-reps(1000) to generate your final CIs.*/
-simulate EY_a0=r(boot_0) EY_a1 = r(boot_1) ///
- difference = r(boot_diff), reps(10) seed(1): bootstdz
-
-/* Next, format the point estimate to allow Stata to calculate our
-standard errors and confidence intervals*/
-
-* Addition: read back in the observe matrix
-mata mata matuse ./data/observe, replace
-mata st_matrix("observe", observe)
-
-matrix pe = observe[2..4, 2]'
-matrix list pe
-
-/* Finally, the bstat command generates valid 95% confidence intervals
-under the normal approximation using our bootstrap results.
-The default results use a normal approximation to calcutlate the
-confidence intervals.
-Note, n contains the original sample size of your data before censoring*/
-bstat, stat(pe) n(1629)
*Run program 13.3 to obtain point estimates, and then the code below*
+
+capture program drop bootstdz
+
+program define bootstdz, rclass
+use ./data/nhefs_std, clear
+
+preserve
+
+* Draw bootstrap sample from original observations
+bsample
+
+/* Create copies with each value of qsmk in bootstrap sample.
+First, duplicate the dataset and create a variable `interv` which
+indicates which copy is the duplicate (interv =1)*/
+expand 2, generate(interv_b)
+
+/* Next, duplicate the original copy (interv = 0) again, and create
+another variable `interv2` to indicate the copy*/
+expand 2 if interv_b == 0, generate(interv2_b)
+
+/* Now, change the value of interv to -1 in one of the copies so that
+there are unique values of interv for each copy*/
+replace interv_b = -1 if interv2_b ==1
+drop interv2_b
+
+/* Two of the copies will be for computing the standardized result.
+For these two copies (interv = 0 and interv = 1), set the outcome to
+missing and force qsmk to either 0 or 1, respectively*/
+replace wt82_71 = . if interv_b != -1
+replace qsmk = 0 if interv_b == 0
+replace qsmk = 1 if interv_b == 1
+
+* Run regression
+regress wt82_71 qsmk sex race c.age##c.age ib(last).education ///
+ c.smokeintensity##c.smokeintensity c.smokeyrs##c.smokeyrs ///
+ ib(last).exercise ib(last).active c.wt71##c.wt71 ///
+ qsmk#c.smokeintensity
+
+/* Ask Stata for expected values.
+Stata will give you expected values for all copies, not just the
+original ones*/
+predict predY_b, xb
+summarize predY_b if interv_b == 0
+return scalar boot_0 = r(mean)
+summarize predY_b if interv_b == 1
+return scalar boot_1 = r(mean)
+return scalar boot_diff = return(boot_1) - return(boot_0)
+drop meanY_b
+
+restore
+
+end
+
+/* Then we use the `simulate` command to run the bootstraps as many
+times as we want.
+Start with reps(10) to make sure your code runs, and then change to
+reps(1000) to generate your final CIs.*/
+simulate EY_a0=r(boot_0) EY_a1 = r(boot_1) ///
+ difference = r(boot_diff), reps(10) seed(1): bootstdz
+
+/* Next, format the point estimate to allow Stata to calculate our
+standard errors and confidence intervals*/
+
+* Addition: read back in the observe matrix
+mata mata matuse ./data/observe, replace
+mata st_matrix("observe", observe)
+
+matrix pe = observe[2..4, 2]'
+matrix list pe
+
+/* Finally, the bstat command generates valid 95% confidence intervals
+under the normal approximation using our bootstrap results.
+The default results use a normal approximation to calcutlate the
+confidence intervals.
+Note, n contains the original sample size of your data before censoring*/
+bstat, stat(pe) n(1629)
12.
Command: bootstdz
diff --git a/docs/standardization-and-the-parametric-g-formula.html b/docs/standardization-and-the-parametric-g-formula.html
index 2d766e8..50c6493 100644
--- a/docs/standardization-and-the-parametric-g-formula.html
+++ b/docs/standardization-and-the-parametric-g-formula.html
@@ -26,7 +26,7 @@
-
+
@@ -316,92 +316,92 @@
Program 13.1
-library(here)
# install.packages("readxl") # install package if required
-library("readxl")
-nhefs <- read_excel(here("data", "NHEFS.xls"))
-
-# some preprocessing of the data
-nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
-
-fit <-
- glm(
- wt82_71 ~ qsmk + sex + race + age + I(age * age) + as.factor(education)
- + smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs
- + I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active)
- + wt71 + I(wt71 * wt71) + qsmk * smokeintensity,
- data = nhefs
- )
-summary(fit)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71) + qsmk * smokeintensity,
-#> data = nhefs)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
-#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
-#> sex -1.4302717 0.4689576 -3.050 0.002328 **
-#> race 0.5601096 0.5818888 0.963 0.335913
-#> age 0.3596353 0.1633188 2.202 0.027809 *
-#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
-#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
-#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
-#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
-#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
-#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
-#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
-#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
-#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
-#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
-#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
-#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
-#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
-#> wt71 0.0455018 0.0833709 0.546 0.585299
-#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
-#> qsmk:smokeintensity 0.0466628 0.0351448 1.328 0.184463
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 53.5683)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 82763 on 1545 degrees of freedom
-#> (63 observations deleted due to missingness)
-#> AIC: 10701
-#>
-#> Number of Fisher Scoring iterations: 2
-nhefs$predicted.meanY <- predict(fit, nhefs)
-
-nhefs[which(nhefs$seqn == 24770), c(
- "predicted.meanY",
- "qsmk",
- "sex",
- "race",
- "age",
- "education",
- "smokeintensity",
- "smokeyrs",
- "exercise",
- "active",
- "wt71"
-)]
-#> # A tibble: 1 × 11
-#> predicted.meanY qsmk sex race age education smokeintensity smokeyrs
-#> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
-#> 1 0.342 0 0 0 26 4 15 12
-#> # ℹ 3 more variables: exercise <dbl>, active <dbl>, wt71 <dbl>
-
-summary(nhefs$predicted.meanY[nhefs$cens == 0])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -10.876 1.116 3.042 2.638 4.511 9.876
-summary(nhefs$wt82_71[nhefs$cens == 0])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> -41.280 -1.478 2.604 2.638 6.690 48.538
# install.packages("readxl") # install package if required
+library("readxl")
+nhefs <- read_excel(here("data", "NHEFS.xls"))
+
+# some preprocessing of the data
+nhefs$cens <- ifelse(is.na(nhefs$wt82), 1, 0)
+
+fit <-
+ glm(
+ wt82_71 ~ qsmk + sex + race + age + I(age * age) + as.factor(education)
+ + smokeintensity + I(smokeintensity * smokeintensity) + smokeyrs
+ + I(smokeyrs * smokeyrs) + as.factor(exercise) + as.factor(active)
+ + wt71 + I(wt71 * wt71) + qsmk * smokeintensity,
+ data = nhefs
+ )
+summary(fit)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71) + qsmk * smokeintensity,
+#> data = nhefs)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
+#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
+#> sex -1.4302717 0.4689576 -3.050 0.002328 **
+#> race 0.5601096 0.5818888 0.963 0.335913
+#> age 0.3596353 0.1633188 2.202 0.027809 *
+#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
+#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
+#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
+#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
+#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
+#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
+#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
+#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
+#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
+#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
+#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
+#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
+#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
+#> wt71 0.0455018 0.0833709 0.546 0.585299
+#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
+#> qsmk:smokeintensity 0.0466628 0.0351448 1.328 0.184463
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 53.5683)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 82763 on 1545 degrees of freedom
+#> (63 observations deleted due to missingness)
+#> AIC: 10701
+#>
+#> Number of Fisher Scoring iterations: 2
nhefs$predicted.meanY <- predict(fit, nhefs)
+
+nhefs[which(nhefs$seqn == 24770), c(
+ "predicted.meanY",
+ "qsmk",
+ "sex",
+ "race",
+ "age",
+ "education",
+ "smokeintensity",
+ "smokeyrs",
+ "exercise",
+ "active",
+ "wt71"
+)]
+#> # A tibble: 1 × 11
+#> predicted.meanY qsmk sex race age education smokeintensity smokeyrs
+#> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
+#> 1 0.342 0 0 0 26 4 15 12
+#> # ℹ 3 more variables: exercise <dbl>, active <dbl>, wt71 <dbl>
+summary(nhefs$predicted.meanY[nhefs$cens == 0])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -10.876 1.116 3.042 2.638 4.511 9.876
summary(nhefs$wt82_71[nhefs$cens == 0])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> -41.280 -1.478 2.604 2.638 6.690 48.538
Program 13.2
@@ -409,68 +409,68 @@ Program 13.2
id <- c(
- "Rheia",
- "Kronos",
- "Demeter",
- "Hades",
- "Hestia",
- "Poseidon",
- "Hera",
- "Zeus",
- "Artemis",
- "Apollo",
- "Leto",
- "Ares",
- "Athena",
- "Hephaestus",
- "Aphrodite",
- "Cyclope",
- "Persephone",
- "Hermes",
- "Hebe",
- "Dionysus"
-)
-N <- length(id)
-L <- c(0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1)
-A <- c(0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1)
-Y <- c(0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0)
-interv <- rep(-1, N)
-observed <- cbind(L, A, Y, interv)
-untreated <- cbind(L, rep(0, N), rep(NA, N), rep(0, N))
-treated <- cbind(L, rep(1, N), rep(NA, N), rep(1, N))
-table22 <- as.data.frame(rbind(observed, untreated, treated))
-table22$id <- rep(id, 3)
-
-glm.obj <- glm(Y ~ A * L, data = table22)
-summary(glm.obj)
-#>
-#> Call:
-#> glm(formula = Y ~ A * L, data = table22)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 2.500e-01 2.552e-01 0.980 0.342
-#> A 3.957e-17 3.608e-01 0.000 1.000
-#> L 4.167e-01 3.898e-01 1.069 0.301
-#> A:L -1.313e-16 4.959e-01 0.000 1.000
-#>
-#> (Dispersion parameter for gaussian family taken to be 0.2604167)
-#>
-#> Null deviance: 5.0000 on 19 degrees of freedom
-#> Residual deviance: 4.1667 on 16 degrees of freedom
-#> (40 observations deleted due to missingness)
-#> AIC: 35.385
-#>
-#> Number of Fisher Scoring iterations: 2
-table22$predicted.meanY <- predict(glm.obj, table22)
-
-mean(table22$predicted.meanY[table22$interv == -1])
-#> [1] 0.5
-mean(table22$predicted.meanY[table22$interv == 0])
-#> [1] 0.5
-mean(table22$predicted.meanY[table22$interv == 1])
-#> [1] 0.5
id <- c(
+ "Rheia",
+ "Kronos",
+ "Demeter",
+ "Hades",
+ "Hestia",
+ "Poseidon",
+ "Hera",
+ "Zeus",
+ "Artemis",
+ "Apollo",
+ "Leto",
+ "Ares",
+ "Athena",
+ "Hephaestus",
+ "Aphrodite",
+ "Cyclope",
+ "Persephone",
+ "Hermes",
+ "Hebe",
+ "Dionysus"
+)
+N <- length(id)
+L <- c(0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1)
+A <- c(0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1)
+Y <- c(0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0)
+interv <- rep(-1, N)
+observed <- cbind(L, A, Y, interv)
+untreated <- cbind(L, rep(0, N), rep(NA, N), rep(0, N))
+treated <- cbind(L, rep(1, N), rep(NA, N), rep(1, N))
+table22 <- as.data.frame(rbind(observed, untreated, treated))
+table22$id <- rep(id, 3)
+
+glm.obj <- glm(Y ~ A * L, data = table22)
+summary(glm.obj)
+#>
+#> Call:
+#> glm(formula = Y ~ A * L, data = table22)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 2.500e-01 2.552e-01 0.980 0.342
+#> A 3.957e-17 3.608e-01 0.000 1.000
+#> L 4.167e-01 3.898e-01 1.069 0.301
+#> A:L -1.313e-16 4.959e-01 0.000 1.000
+#>
+#> (Dispersion parameter for gaussian family taken to be 0.2604167)
+#>
+#> Null deviance: 5.0000 on 19 degrees of freedom
+#> Residual deviance: 4.1667 on 16 degrees of freedom
+#> (40 observations deleted due to missingness)
+#> AIC: 35.385
+#>
+#> Number of Fisher Scoring iterations: 2
table22$predicted.meanY <- predict(glm.obj, table22)
+
+mean(table22$predicted.meanY[table22$interv == -1])
+#> [1] 0.5
Program 13.3
@@ -478,88 +478,88 @@ Program 13.3
# create a dataset with 3 copies of each subject
-nhefs$interv <- -1 # 1st copy: equal to original one
-
-interv0 <- nhefs # 2nd copy: treatment set to 0, outcome to missing
-interv0$interv <- 0
-interv0$qsmk <- 0
-interv0$wt82_71 <- NA
-
-interv1 <- nhefs # 3rd copy: treatment set to 1, outcome to missing
-interv1$interv <- 1
-interv1$qsmk <- 1
-interv1$wt82_71 <- NA
-
-onesample <- rbind(nhefs, interv0, interv1) # combining datasets
-
-# linear model to estimate mean outcome conditional on treatment and confounders
-# parameters are estimated using original observations only (nhefs)
-# parameter estimates are used to predict mean outcome for observations with
-# treatment set to 0 (interv=0) and to 1 (interv=1)
-
-std <- glm(
- wt82_71 ~ qsmk + sex + race + age + I(age * age)
- + as.factor(education) + smokeintensity
- + I(smokeintensity * smokeintensity) + smokeyrs
- + I(smokeyrs * smokeyrs) + as.factor(exercise)
- + as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
- data = onesample
-)
-summary(std)
-#>
-#> Call:
-#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
-#> as.factor(education) + smokeintensity + I(smokeintensity *
-#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
-#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
-#> data = onesample)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
-#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
-#> sex -1.4302717 0.4689576 -3.050 0.002328 **
-#> race 0.5601096 0.5818888 0.963 0.335913
-#> age 0.3596353 0.1633188 2.202 0.027809 *
-#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
-#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
-#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
-#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
-#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
-#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
-#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
-#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
-#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
-#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
-#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
-#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
-#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
-#> wt71 0.0455018 0.0833709 0.546 0.585299
-#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
-#> I(qsmk * smokeintensity) 0.0466628 0.0351448 1.328 0.184463
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 53.5683)
-#>
-#> Null deviance: 97176 on 1565 degrees of freedom
-#> Residual deviance: 82763 on 1545 degrees of freedom
-#> (3321 observations deleted due to missingness)
-#> AIC: 10701
-#>
-#> Number of Fisher Scoring iterations: 2
-onesample$predicted_meanY <- predict(std, onesample)
-
-# estimate mean outcome in each of the groups interv=0, and interv=1
-# this mean outcome is a weighted average of the mean outcomes in each combination
-# of values of treatment and confounders, that is, the standardized outcome
-mean(onesample[which(onesample$interv == -1), ]$predicted_meanY)
-#> [1] 2.56319
-mean(onesample[which(onesample$interv == 0), ]$predicted_meanY)
-#> [1] 1.660267
-mean(onesample[which(onesample$interv == 1), ]$predicted_meanY)
-#> [1] 5.178841
# create a dataset with 3 copies of each subject
+nhefs$interv <- -1 # 1st copy: equal to original one
+
+interv0 <- nhefs # 2nd copy: treatment set to 0, outcome to missing
+interv0$interv <- 0
+interv0$qsmk <- 0
+interv0$wt82_71 <- NA
+
+interv1 <- nhefs # 3rd copy: treatment set to 1, outcome to missing
+interv1$interv <- 1
+interv1$qsmk <- 1
+interv1$wt82_71 <- NA
+
+onesample <- rbind(nhefs, interv0, interv1) # combining datasets
+
+# linear model to estimate mean outcome conditional on treatment and confounders
+# parameters are estimated using original observations only (nhefs)
+# parameter estimates are used to predict mean outcome for observations with
+# treatment set to 0 (interv=0) and to 1 (interv=1)
+
+std <- glm(
+ wt82_71 ~ qsmk + sex + race + age + I(age * age)
+ + as.factor(education) + smokeintensity
+ + I(smokeintensity * smokeintensity) + smokeyrs
+ + I(smokeyrs * smokeyrs) + as.factor(exercise)
+ + as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
+ data = onesample
+)
+summary(std)
+#>
+#> Call:
+#> glm(formula = wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+#> as.factor(education) + smokeintensity + I(smokeintensity *
+#> smokeintensity) + smokeyrs + I(smokeyrs * smokeyrs) + as.factor(exercise) +
+#> as.factor(active) + wt71 + I(wt71 * wt71) + I(qsmk * smokeintensity),
+#> data = onesample)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -1.5881657 4.3130359 -0.368 0.712756
+#> qsmk 2.5595941 0.8091486 3.163 0.001590 **
+#> sex -1.4302717 0.4689576 -3.050 0.002328 **
+#> race 0.5601096 0.5818888 0.963 0.335913
+#> age 0.3596353 0.1633188 2.202 0.027809 *
+#> I(age * age) -0.0061010 0.0017261 -3.534 0.000421 ***
+#> as.factor(education)2 0.7904440 0.6070005 1.302 0.193038
+#> as.factor(education)3 0.5563124 0.5561016 1.000 0.317284
+#> as.factor(education)4 1.4915695 0.8322704 1.792 0.073301 .
+#> as.factor(education)5 -0.1949770 0.7413692 -0.263 0.792589
+#> smokeintensity 0.0491365 0.0517254 0.950 0.342287
+#> I(smokeintensity * smokeintensity) -0.0009907 0.0009380 -1.056 0.291097
+#> smokeyrs 0.1343686 0.0917122 1.465 0.143094
+#> I(smokeyrs * smokeyrs) -0.0018664 0.0015437 -1.209 0.226830
+#> as.factor(exercise)1 0.2959754 0.5351533 0.553 0.580298
+#> as.factor(exercise)2 0.3539128 0.5588587 0.633 0.526646
+#> as.factor(active)1 -0.9475695 0.4099344 -2.312 0.020935 *
+#> as.factor(active)2 -0.2613779 0.6845577 -0.382 0.702647
+#> wt71 0.0455018 0.0833709 0.546 0.585299
+#> I(wt71 * wt71) -0.0009653 0.0005247 -1.840 0.066001 .
+#> I(qsmk * smokeintensity) 0.0466628 0.0351448 1.328 0.184463
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 53.5683)
+#>
+#> Null deviance: 97176 on 1565 degrees of freedom
+#> Residual deviance: 82763 on 1545 degrees of freedom
+#> (3321 observations deleted due to missingness)
+#> AIC: 10701
+#>
+#> Number of Fisher Scoring iterations: 2
onesample$predicted_meanY <- predict(std, onesample)
+
+# estimate mean outcome in each of the groups interv=0, and interv=1
+# this mean outcome is a weighted average of the mean outcomes in each combination
+# of values of treatment and confounders, that is, the standardized outcome
+mean(onesample[which(onesample$interv == -1), ]$predicted_meanY)
+#> [1] 2.56319
Program 13.4
@@ -567,88 +567,88 @@ Program 13.4
#install.packages("boot") # install package if required
-library(boot)
-
-# function to calculate difference in means
-standardization <- function(data, indices) {
- # create a dataset with 3 copies of each subject
- d <- data[indices, ] # 1st copy: equal to original one`
- d$interv <- -1
- d0 <- d # 2nd copy: treatment set to 0, outcome to missing
- d0$interv <- 0
- d0$qsmk <- 0
- d0$wt82_71 <- NA
- d1 <- d # 3rd copy: treatment set to 1, outcome to missing
- d1$interv <- 1
- d1$qsmk <- 1
- d1$wt82_71 <- NA
- d.onesample <- rbind(d, d0, d1) # combining datasets
-
- # linear model to estimate mean outcome conditional on treatment and confounders
- # parameters are estimated using original observations only (interv= -1)
- # parameter estimates are used to predict mean outcome for observations with set
- # treatment (interv=0 and interv=1)
- fit <- glm(
- wt82_71 ~ qsmk + sex + race + age + I(age * age) +
- as.factor(education) + smokeintensity +
- I(smokeintensity * smokeintensity) + smokeyrs + I(smokeyrs *
- smokeyrs) +
- as.factor(exercise) + as.factor(active) + wt71 + I(wt71 *
- wt71),
- data = d.onesample
- )
-
- d.onesample$predicted_meanY <- predict(fit, d.onesample)
-
- # estimate mean outcome in each of the groups interv=-1, interv=0, and interv=1
- return(c(
- mean(d.onesample$predicted_meanY[d.onesample$interv == -1]),
- mean(d.onesample$predicted_meanY[d.onesample$interv == 0]),
- mean(d.onesample$predicted_meanY[d.onesample$interv == 1]),
- mean(d.onesample$predicted_meanY[d.onesample$interv == 1]) -
- mean(d.onesample$predicted_meanY[d.onesample$interv == 0])
- ))
-}
-
-# bootstrap
-results <- boot(data = nhefs,
- statistic = standardization,
- R = 5)
-
-# generating confidence intervals
-se <- c(sd(results$t[, 1]),
- sd(results$t[, 2]),
- sd(results$t[, 3]),
- sd(results$t[, 4]))
-mean <- results$t0
-ll <- mean - qnorm(0.975) * se
-ul <- mean + qnorm(0.975) * se
-
-bootstrap <-
- data.frame(cbind(
- c(
- "Observed",
- "No Treatment",
- "Treatment",
- "Treatment - No Treatment"
- ),
- mean,
- se,
- ll,
- ul
- ))
-bootstrap
-#> V1 mean se ll
-#> 1 Observed 2.56188497106099 0.0984024612972166 2.36901969092835
-#> 2 No Treatment 1.65212306626744 0.212209617046544 1.23619985968317
-#> 3 Treatment 5.11474489549336 0.641158250090791 3.85809781692468
-#> 4 Treatment - No Treatment 3.46262182922592 0.828981620853456 1.83784770850751
-#> ul
-#> 1 2.75475025119363
-#> 2 2.0680462728517
-#> 3 6.37139197406203
-#> 4 5.08739594994433
#install.packages("boot") # install package if required
+library(boot)
+
+# function to calculate difference in means
+standardization <- function(data, indices) {
+ # create a dataset with 3 copies of each subject
+ d <- data[indices, ] # 1st copy: equal to original one`
+ d$interv <- -1
+ d0 <- d # 2nd copy: treatment set to 0, outcome to missing
+ d0$interv <- 0
+ d0$qsmk <- 0
+ d0$wt82_71 <- NA
+ d1 <- d # 3rd copy: treatment set to 1, outcome to missing
+ d1$interv <- 1
+ d1$qsmk <- 1
+ d1$wt82_71 <- NA
+ d.onesample <- rbind(d, d0, d1) # combining datasets
+
+ # linear model to estimate mean outcome conditional on treatment and confounders
+ # parameters are estimated using original observations only (interv= -1)
+ # parameter estimates are used to predict mean outcome for observations with set
+ # treatment (interv=0 and interv=1)
+ fit <- glm(
+ wt82_71 ~ qsmk + sex + race + age + I(age * age) +
+ as.factor(education) + smokeintensity +
+ I(smokeintensity * smokeintensity) + smokeyrs + I(smokeyrs *
+ smokeyrs) +
+ as.factor(exercise) + as.factor(active) + wt71 + I(wt71 *
+ wt71),
+ data = d.onesample
+ )
+
+ d.onesample$predicted_meanY <- predict(fit, d.onesample)
+
+ # estimate mean outcome in each of the groups interv=-1, interv=0, and interv=1
+ return(c(
+ mean(d.onesample$predicted_meanY[d.onesample$interv == -1]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv == 0]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv == 1]),
+ mean(d.onesample$predicted_meanY[d.onesample$interv == 1]) -
+ mean(d.onesample$predicted_meanY[d.onesample$interv == 0])
+ ))
+}
+
+# bootstrap
+results <- boot(data = nhefs,
+ statistic = standardization,
+ R = 5)
+
+# generating confidence intervals
+se <- c(sd(results$t[, 1]),
+ sd(results$t[, 2]),
+ sd(results$t[, 3]),
+ sd(results$t[, 4]))
+mean <- results$t0
+ll <- mean - qnorm(0.975) * se
+ul <- mean + qnorm(0.975) * se
+
+bootstrap <-
+ data.frame(cbind(
+ c(
+ "Observed",
+ "No Treatment",
+ "Treatment",
+ "Treatment - No Treatment"
+ ),
+ mean,
+ se,
+ ll,
+ ul
+ ))
+bootstrap
+#> V1 mean se ll
+#> 1 Observed 2.56188497106099 0.145472494596704 2.27676412091025
+#> 2 No Treatment 1.65212306626744 0.101915266567174 1.45237281432098
+#> 3 Treatment 5.11474489549336 0.333215898342795 4.46165373566532
+#> 4 Treatment - No Treatment 3.46262182922592 0.301829821703863 2.8710462492262
+#> ul
+#> 1 2.84700582121172
+#> 2 1.8518733182139
+#> 3 5.76783605532139
+#> 4 4.05419740922564
11. Why model: Stata
-
-
+
+
checking extremes consistency and verifying not already installed...
all files already exist and are up to date.
@@ -329,38 +329,38 @@
Program 11.1
clear
-
-**Figure 11.1**
-*create the dataset*
-input A Y
-1 200
-1 150
-1 220
-1 110
-1 50
-1 180
-1 90
-1 170
-0 170
-0 30
-0 70
-0 110
-0 80
-0 50
-0 10
-0 20
-end
-
-*Save the data*
-qui save ./data/fig1, replace
-
-*Build the scatterplot*
-scatter Y A, ylab(0(50)250) xlab(0 1) xscale(range(-0.5 1.5))
-qui gr export figs/stata-fig-11-1.png, replace
-
-*Output the mean values for Y in each level of A*
-bysort A: sum Y
clear
+
+**Figure 11.1**
+*create the dataset*
+input A Y
+1 200
+1 150
+1 220
+1 110
+1 50
+1 180
+1 90
+1 170
+0 170
+0 30
+0 70
+0 110
+0 80
+0 50
+0 10
+0 20
+end
+
+*Save the data*
+qui save ./data/fig1, replace
+
+*Build the scatterplot*
+scatter Y A, ylab(0(50)250) xlab(0 1) xscale(range(-0.5 1.5))
+qui gr export figs/stata-fig-11-1.png, replace
+
+*Output the mean values for Y in each level of A*
+bysort A: sum Y
A Y
1. 1 200
2. 1 150
@@ -398,35 +398,35 @@
Program 11.1
*Clear the workspace to be able to use a new dataset*
-clear
-
-**Figure 11.2**
-input A Y
-1 110
-1 80
-1 50
-1 40
-2 170
-2 30
-2 70
-2 50
-3 110
-3 50
-3 180
-3 130
-4 200
-4 150
-4 220
-4 210
-end
-
-qui save ./data/fig2, replace
-
-scatter Y A, ylab(0(50)250) xlab(0(1)4) xscale(range(0 4.5))
-qui gr export figs/stata-fig-11-2.png, replace
-
-bysort A: sum Y
*Clear the workspace to be able to use a new dataset*
+clear
+
+**Figure 11.2**
+input A Y
+1 110
+1 80
+1 50
+1 40
+2 170
+2 30
+2 70
+2 50
+3 110
+3 50
+3 180
+3 130
+4 200
+4 150
+4 220
+4 210
+end
+
+qui save ./data/fig2, replace
+
+scatter Y A, ylab(0(50)250) xlab(0(1)4) xscale(range(0 4.5))
+qui gr export figs/stata-fig-11-2.png, replace
+
+bysort A: sum Y
A Y
1. 1 110
2. 1 80
@@ -478,32 +478,32 @@ Program 11.1
-clear
-
-**Figure 11.3**
-input A Y
-3 21
-11 54
-17 33
-23 101
-29 85
-37 65
-41 157
-53 120
-67 111
-79 200
-83 140
-97 220
-60 230
-71 217
-15 11
-45 190
-end
-
-qui save ./data/fig3, replace
-
-scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100))
-qui gr export figs/stata-fig-11-3.png, replace
+clear
+
+**Figure 11.3**
+input A Y
+3 21
+11 54
+17 33
+23 101
+29 85
+37 65
+41 157
+53 120
+67 111
+79 200
+83 140
+97 220
+60 230
+71 217
+15 11
+45 190
+end
+
+qui save ./data/fig3, replace
+
+scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100))
+qui gr export figs/stata-fig-11-3.png, replace
A Y
1. 3 21
2. 11 54
@@ -530,22 +530,22 @@ Program 11.2**Section 11.2: parametric estimators**
-*Reload data
-use ./data/fig3, clear
-
-*Plot the data*
-scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100))
-
-*Fit the regression model*
-regress Y A, noheader cformat(%5.2f)
-
-*Output the estimated mean Y value when A = 90*
-lincom _b[_cons] + 90*_b[A]
-
-*Plot the data with the regression line: Fig 11.4*
-scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100)) || lfit Y A
-qui gr export figs/stata-fig-11-4.png, replace
+**Section 11.2: parametric estimators**
+*Reload data
+use ./data/fig3, clear
+
+*Plot the data*
+scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100))
+
+*Fit the regression model*
+regress Y A, noheader cformat(%5.2f)
+
+*Output the estimated mean Y value when A = 90*
+lincom _b[_cons] + 90*_b[A]
+
+*Plot the data with the regression line: Fig 11.4*
+scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100)) || lfit Y A
+qui gr export figs/stata-fig-11-4.png, replace
Y | Coefficient Std. err. t P>|t| [95% conf. interval]
-------------+----------------------------------------------------------------
A | 2.14 0.40 5.35 0.000 1.28 2.99
@@ -561,15 +561,15 @@ Program 11.2
-**Section 11.3: non-parametric estimation*
-* Reload the data
-use ./data/fig1, clear
-
-*Fit the regression model*
-regress Y A, noheader cformat(%5.2f)
-
-*E[Y|A=1]*
-di 67.50 + 78.75
+**Section 11.3: non-parametric estimation*
+* Reload the data
+use ./data/fig1, clear
+
+*Fit the regression model*
+regress Y A, noheader cformat(%5.2f)
+
+*E[Y|A=1]*
+di 67.50 + 78.75
Y | Coefficient Std. err. t P>|t| [95% conf. interval]
-------------+----------------------------------------------------------------
A | 78.75 27.88 2.82 0.014 18.95 138.55
@@ -584,21 +584,21 @@ Program 11.3* Reload the data
-use ./data/fig3, clear
-
-*Create the product term*
-gen Asq = A*A
-
-*Fit the regression model*
-regress Y A Asq, noheader cformat(%5.2f)
-
-*Output the estimated mean Y value when A = 90*
-lincom _b[_cons] + 90*_b[A] + 90*90*_b[Asq]
-
-*Plot the data with the regression line: Fig 11.5*
-scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100)) || qfit Y A
-qui gr export figs/stata-fig-11-5.png, replace
+* Reload the data
+use ./data/fig3, clear
+
+*Create the product term*
+gen Asq = A*A
+
+*Fit the regression model*
+regress Y A Asq, noheader cformat(%5.2f)
+
+*Output the estimated mean Y value when A = 90*
+lincom _b[_cons] + 90*_b[A] + 90*90*_b[Asq]
+
+*Plot the data with the regression line: Fig 11.5*
+scatter Y A, ylab(0(50)250) xlab(0(10)100) xscale(range(0 100)) || qfit Y A
+qui gr export figs/stata-fig-11-5.png, replace
Y | Coefficient Std. err. t P>|t| [95% conf. interval]
-------------+----------------------------------------------------------------
A | 4.11 1.53 2.68 0.019 0.80 7.41
diff --git a/docs/why-model.html b/docs/why-model.html
index 5755248..aeef2c9 100644
--- a/docs/why-model.html
+++ b/docs/why-model.html
@@ -26,7 +26,7 @@
-
+
@@ -324,29 +324,29 @@ Program 11.1
summary(Y[A == 0])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 10.0 27.5 60.0 67.5 87.5 170.0
-summary(Y[A == 1])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 50.0 105.0 160.0 146.2 185.0 220.0
-
-A2 <- c(1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4)
-Y2 <- c(110, 80, 50, 40, 170, 30, 70, 50, 110, 50, 180,
- 130, 200, 150, 220, 210)
-
-plot(A2, Y2)
-
-
+summary(Y[A == 1])
#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 40.0 47.5 65.0 70.0 87.5 110.0
-summary(Y2[A2 == 2])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 30 45 60 80 95 170
-summary(Y2[A2 == 3])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 50.0 95.0 120.0 117.5 142.5 180.0
-summary(Y2[A2 == 4])
-#> Min. 1st Qu. Median Mean 3rd Qu. Max.
-#> 150.0 187.5 205.0 195.0 212.5 220.0
+#> 50.0 105.0 160.0 146.2 185.0 220.0
+
+A2 <- c(1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4)
+Y2 <- c(110, 80, 50, 40, 170, 30, 70, 50, 110, 50, 180,
+ 130, 200, 150, 220, 210)
+
+plot(A2, Y2)
+
+
+
+summary(Y2[A2 == 3])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 50.0 95.0 120.0 117.5 142.5 180.0
+summary(Y2[A2 == 4])
+#> Min. 1st Qu. Median Mean 3rd Qu. Max.
+#> 150.0 187.5 205.0 195.0 212.5 220.0
Program 11.2
@@ -354,57 +354,57 @@ Program 11.22-parameter linear model
Data from Figures 11.3 and 11.1
-A3 <-
- c(3, 11, 17, 23, 29, 37, 41, 53, 67, 79, 83, 97, 60, 71, 15, 45)
-Y3 <-
- c(21, 54, 33, 101, 85, 65, 157, 120, 111, 200, 140, 220, 230, 217,
- 11, 190)
-
-plot(Y3 ~ A3)
+A3 <-
+ c(3, 11, 17, 23, 29, 37, 41, 53, 67, 79, 83, 97, 60, 71, 15, 45)
+Y3 <-
+ c(21, 54, 33, 101, 85, 65, 157, 120, 111, 200, 140, 220, 230, 217,
+ 11, 190)
+
+plot(Y3 ~ A3)
-
-summary(glm(Y3 ~ A3))
-#>
-#> Call:
-#> glm(formula = Y3 ~ A3)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 24.5464 21.3300 1.151 0.269094
-#> A3 2.1372 0.3997 5.347 0.000103 ***
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 1944.109)
-#>
-#> Null deviance: 82800 on 15 degrees of freedom
-#> Residual deviance: 27218 on 14 degrees of freedom
-#> AIC: 170.43
-#>
-#> Number of Fisher Scoring iterations: 2
-predict(glm(Y3 ~ A3), data.frame(A3 = 90))
-#> 1
-#> 216.89
-
-summary(glm(Y ~ A))
-#>
-#> Call:
-#> glm(formula = Y ~ A)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) 67.50 19.72 3.424 0.00412 **
-#> A 78.75 27.88 2.824 0.01352 *
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 3109.821)
-#>
-#> Null deviance: 68344 on 15 degrees of freedom
-#> Residual deviance: 43538 on 14 degrees of freedom
-#> AIC: 177.95
-#>
-#> Number of Fisher Scoring iterations: 2
+
+summary(glm(Y3 ~ A3))
+#>
+#> Call:
+#> glm(formula = Y3 ~ A3)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 24.5464 21.3300 1.151 0.269094
+#> A3 2.1372 0.3997 5.347 0.000103 ***
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 1944.109)
+#>
+#> Null deviance: 82800 on 15 degrees of freedom
+#> Residual deviance: 27218 on 14 degrees of freedom
+#> AIC: 170.43
+#>
+#> Number of Fisher Scoring iterations: 2
+
+
+summary(glm(Y ~ A))
+#>
+#> Call:
+#> glm(formula = Y ~ A)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) 67.50 19.72 3.424 0.00412 **
+#> A 78.75 27.88 2.824 0.01352 *
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 3109.821)
+#>
+#> Null deviance: 68344 on 15 degrees of freedom
+#> Residual deviance: 43538 on 14 degrees of freedom
+#> AIC: 177.95
+#>
+#> Number of Fisher Scoring iterations: 2
Program 11.3
@@ -412,32 +412,32 @@ Program 11.33-parameter linear model
Data from Figure 11.3
-Asq <- A3 * A3
-
-mod3 <- glm(Y3 ~ A3 + Asq)
-summary(mod3)
-#>
-#> Call:
-#> glm(formula = Y3 ~ A3 + Asq)
-#>
-#> Coefficients:
-#> Estimate Std. Error t value Pr(>|t|)
-#> (Intercept) -7.40688 31.74777 -0.233 0.8192
-#> A3 4.10723 1.53088 2.683 0.0188 *
-#> Asq -0.02038 0.01532 -1.331 0.2062
-#> ---
-#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
-#>
-#> (Dispersion parameter for gaussian family taken to be 1842.697)
-#>
-#> Null deviance: 82800 on 15 degrees of freedom
-#> Residual deviance: 23955 on 13 degrees of freedom
-#> AIC: 170.39
-#>
-#> Number of Fisher Scoring iterations: 2
-predict(mod3, data.frame(cbind(A3 = 90, Asq = 8100)))
-#> 1
-#> 197.1269
+Asq <- A3 * A3
+
+mod3 <- glm(Y3 ~ A3 + Asq)
+summary(mod3)
+#>
+#> Call:
+#> glm(formula = Y3 ~ A3 + Asq)
+#>
+#> Coefficients:
+#> Estimate Std. Error t value Pr(>|t|)
+#> (Intercept) -7.40688 31.74777 -0.233 0.8192
+#> A3 4.10723 1.53088 2.683 0.0188 *
+#> Asq -0.02038 0.01532 -1.331 0.2062
+#> ---
+#> Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+#>
+#> (Dispersion parameter for gaussian family taken to be 1842.697)
+#>
+#> Null deviance: 82800 on 15 degrees of freedom
+#> Residual deviance: 23955 on 13 degrees of freedom
+#> AIC: 170.39
+#>
+#> Number of Fisher Scoring iterations: 2
+