r-causal
diff --git a/‎exercises/01-whole-game-exercises.Rmd‎
Lines changed: 26 additions & 34 deletions b/‎exercises/01-whole-game-exercises.Rmd‎
Lines changed: 26 additions & 34 deletions
diff --git a/‎exercises/05-pscores-diagnostics-exercises.Rmd‎
Lines changed: 0 additions & 1 deletion b/‎exercises/05-pscores-diagnostics-exercises.Rmd‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎exercises/06-outcome-model-exercises.Rmd‎
Lines changed: 0 additions & 2 deletions b/‎exercises/06-outcome-model-exercises.Rmd‎
Lines changed: 0 additions & 2 deletions
diff --git a/‎slides/raw/01-causal_modeling_whole_game.Rmd‎
Lines changed: 29 additions & 37 deletions b/‎slides/raw/01-causal_modeling_whole_game.Rmd‎
Lines changed: 29 additions & 37 deletions
@@ -9,8 +9,6 @@ library(broom)
 library(rsample)
 library(ggdag)
 library(causaldata)
-library(survey)
-library(tableone)
 ```
 
 ## Causal Modeling: Whole Game
@@ -194,45 +192,39 @@ The main goal here is to *break* the non-causal associations between quitting sm
 
 Standardized mean differences (SMD) are a simple measure of difference that works across variable types. In general, the closer to 0 we are, the better job we have done eliminating the non-causal relationships we drew in our DAG. Note that low SMDs for everything we adjust for do *not* mean that nothing else might confound our study. Unmeasured confounders or misspecified DAGs can still distort our effects, even if our SMDs look great!
 
-We'll use the {survey} and {tableone} package to calculate the SMDs, then visualize them.
+We'll use the {smd} package to calculate the SMDs, then visualize them.
 
 ```{r}
-svy_des <- svydesign(
-  ids = ~ 1,
-  data = nhefs_complete_uc,
-  weights = ~ wts)
-
-smd_table_unweighted <- CreateTableOne(
-  vars = c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
-           "exercise", "active", "wt71"),
-  strata = "qsmk",
-  data = nhefs_complete_uc,
-  test = FALSE)
-
-smd_table <- svyCreateTableOne(
-  vars = c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
-           "exercise", "active", "wt71"),
-  strata = "qsmk",
-  data = svy_des,
-  test = FALSE)
-
-
-plot_df <- data.frame(
-  var = rownames(ExtractSmd(smd_table)),                        
-  Unadjusted = as.numeric(ExtractSmd(smd_table_unweighted)),                      
-  Weighted = as.numeric(ExtractSmd(smd_table))) %>%
-  pivot_longer(-var, names_to = "Method", values_to = "SMD")
+# Covariates whose standardized mean differences (SMDs) are computed below.
+# NOTE(review): smd() comes from the {smd} package; no visible hunk for this
+# file adds library(smd) -- confirm it is attached before this chunk runs.
+vars <- c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
+          "exercise", "active", "wt71")
+
+# For every covariate in vars, compute the SMD between the qsmk groups twice:
+# once without weights and once passing wts as the weights. across() names
+# each result <covariate>_<unweighted|weighted>, giving a single wide row.
+plot_df <- nhefs_complete_uc %>% 
+  summarise(
+    across(
+      all_of(vars), 
+      list(
+        unweighted = ~smd(.x, qsmk)$estimate, 
+        weighted = ~smd(.x, qsmk, wts)$estimate
+      )
+    )
+  ) %>% 
+  # Reshape to one row per covariate/method pair. Splitting the column names
+  # on "_" works because none of the names in vars contains an underscore.
+  pivot_longer(
+    everything(), 
+    values_to = "SMD", 
+    names_to = c("variable", "Method"),
+    names_sep = "_"
+  )
 
+# Plot the absolute SMD of each covariate (y axis) for both methods, with one
+# line/point series per Method and a vertical reference line at 0.1.
 ggplot(
   data = plot_df,
-  mapping = aes(x = var, y = SMD, group = Method, color = Method)
+  aes(x = abs(SMD), y = variable, group = Method, color = Method)
 ) +
-  geom_line() +
+  geom_line(orientation = "y") +
   geom_point() + 
-  geom_hline(yintercept = 0.1, color = "black", size = 0.1) +  
-  coord_flip() +
-  theme_minimal()
-
+  geom_vline(xintercept = 0.1, color = "black", size = 0.1) +
+  theme_minimal() +
+  # presumably grey85 -> "unweighted" and #00BFC4 -> "weighted" (alphabetical
+  # order of the Method values) -- TODO confirm
+  scale_color_manual(values = c("grey85", "#00BFC4")) +
+  xlim(0, .3)
 ```
 
 These look pretty good! Some variables are better than others, but weighting appears to have done a much better job eliminating these differences than an unadjusted analysis.
 
@@ -7,7 +7,6 @@ output: html_document
 ```{r}
 library(tidyverse)
 library(survey)
-library(tableone)
 library(broom)
 library(causaldata)
 ```
 
@@ -6,8 +6,6 @@ output: html_document
 
 ```{r}
 library(tidyverse)
-library(survey)
-library(tableone)
 library(broom)
 library(causaldata)
 library(rsample)
 
@@ -22,12 +22,11 @@ class: inverse
 options(htmltools.dir.version = FALSE, tibble.max_extra_cols = 6, tibble.width = 60)
 knitr::opts_chunk$set(warning = FALSE, message = FALSE, fig.align = "center", dpi = 320, fig.height = 4)
 library(tidyverse)
+library(smd)
 library(broom)
 library(rsample)
 library(ggdag)
 library(causaldata)
-library(survey)
-library(tableone)
 ```
 
 # Broad strokes
@@ -260,60 +259,53 @@ ggplot(nhefs_complete_uc, aes(wts)) +
 ---
 
 ```{r, echo=FALSE, fig.height=5.5}
-svy_des <- svydesign(
-  ids = ~ 1,
-  data = nhefs_complete_uc,
-  weights = ~ wts)
-
-smd_table_unweighted <- CreateTableOne(
-  vars = c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
-           "exercise", "active", "wt71"),
-  strata = "qsmk",
-  data = nhefs_complete_uc,
-  test = FALSE)
-
-smd_table <- svyCreateTableOne(
-  vars = c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
-           "exercise", "active", "wt71"),
-  strata = "qsmk",
-  data = svy_des,
-  test = FALSE)
-
-plot_df <- data.frame(
-  var = rownames(ExtractSmd(smd_table)),                        
-  Unadjusted = as.numeric(ExtractSmd(smd_table_unweighted)),                      
-  Weighted = as.numeric(ExtractSmd(smd_table))) %>%
-  pivot_longer(-var, names_to = "Method", values_to = "SMD")
+# Covariates whose standardized mean differences (SMDs) are computed below.
+vars <- c("sex", "race", "age", "education", "smokeintensity", "smokeyrs", 
+          "exercise", "active", "wt71")
+
+# For every covariate in vars, compute the SMD between the qsmk groups twice:
+# once without weights and once passing wts as the weights. across() names
+# each result <covariate>_<unweighted|weighted>, giving a single wide row.
+plot_df <- nhefs_complete_uc %>% 
+  summarise(
+    across(
+      all_of(vars), 
+      list(
+        unweighted = ~smd(.x, qsmk)$estimate, 
+        weighted = ~smd(.x, qsmk, wts)$estimate
+      )
+    )
+  ) %>% 
+  # Reshape to one row per covariate/method pair. Splitting the column names
+  # on "_" works because none of the names in vars contains an underscore.
+  pivot_longer(
+    everything(), 
+    values_to = "SMD", 
+    names_to = c("variable", "Method"),
+    names_sep = "_"
+  )
 ```
 
 
 ```{r, echo=FALSE, fig.height=5.5}
+# Plot the absolute SMD of each covariate (y axis) using only the rows where
+# Method is "unweighted", with a vertical reference line at 0.1.
 ggplot(
-  data = plot_df %>% filter(Method == "Unadjusted"),
-  mapping = aes(x = var, y = SMD, group = Method, color = Method)
+  data = plot_df %>% filter(Method == "unweighted"),
+  aes(x = abs(SMD), y = variable, group = Method, color = Method)
 ) +
-  geom_line() +
+  geom_line(orientation = "y") +
   geom_point() + 
-  geom_hline(yintercept = 0.1, color = "black", size = 0.1) +  
-  coord_flip() +
+  geom_vline(xintercept = 0.1, color = "black", size = 0.1) +
   theme_minimal() +
-  ylim(0, .3)
+  xlim(0, .3)
 
 ---
 
 ```{r, echo=FALSE, fig.height=5.5}
+# Plot the absolute SMD of each covariate (y axis) for every Method in
+# plot_df, with one line/point series per Method and a vertical reference
+# line at 0.1.
 ggplot(
   data = plot_df,
-  mapping = aes(x = var, y = SMD, group = Method, color = Method)
+  aes(x = abs(SMD), y = variable, group = Method, color = Method)
 ) +
-  geom_line() +
+  geom_line(orientation = "y") +
   geom_point() + 
-  geom_hline(yintercept = 0.1, color = "black", size = 0.1) +  
-  coord_flip() +
+  geom_vline(xintercept = 0.1, color = "black", size = 0.1) +
   theme_minimal() +
   scale_color_manual(values = c("grey85", "#00BFC4")) +
-  ylim(0, .3)
+  xlim(0, .3)
 ```
 
 ---