---
title: "Code from examples in manuscript"
output: rmarkdown::html_vignette
vignette: >
  %\VignetteIndexEntry{Code from examples in manuscript}
  %\VignetteEncoding{UTF-8}
  %\VignetteEngine{knitr::rmarkdown}
editor_options:
  chunk_output_type: console
---

```{r, include = FALSE}
knitr::opts_chunk$set(
  collapse = TRUE,
  comment = "#>"
)
```

```{r setup}
library(causaloptim)
```

## confounded exposure and outcome

```{r}
b <- initialize_graph(graph_from_literal(X -+ Y, Ur -+ X, Ur -+ Y))
## number of levels per vertex; presumably in the order the vertices first
## appear in the literal (X, Y, Ur), i.e. a three-level exposure X
V(b)$nvals <- c(3, 2, 2)

## contrast of exposure levels 1 vs 0
obj <- analyze_graph(b, constraints = NULL,
                     effectt = "p{Y(X = 1) = 1} - p{Y(X = 0) = 1}")
optimize_effect_2(obj)

## contrast of exposure levels 2 vs 0
obj2 <- analyze_graph(b, constraints = NULL,
                      effectt = "p{Y(X = 2) = 1} - p{Y(X = 0) = 1}")
optimize_effect_2(obj2)

## contrast of exposure levels 2 vs 1
obj3 <- analyze_graph(b, constraints = NULL,
                      effectt = "p{Y(X = 2) = 1} - p{Y(X = 1) = 1}")
optimize_effect_2(obj3)
```

## multiple instruments

This chunk is not run when the vignette is built, because it takes a few minutes to compute.

```{r, eval = FALSE}
## two linked binary instruments Z1 and Z2
b <- graph_from_literal(Z1 -+ X, Z2 -+ X, Z2 -+ Z1, Ul -+ Z1, Ul -+ Z2,
                        X -+ Y, Ur -+ X, Ur -+ Y)
V(b)$leftside <- c(1, 0, 1, 1, 0, 0)
V(b)$latent <- c(0, 0, 0, 1, 0, 1)
V(b)$nvals <- c(2, 2, 2, 2, 2, 2)
E(b)$rlconnect <- c(0, 0, 0, 0, 0, 0, 0, 0)
E(b)$edge.monotone <- c(0, 0, 0, 0, 0, 0, 0, 0)

obj <- analyze_graph(b, constraints = NULL,
                     effectt = "p{Y(X = 1) = 1} - p{Y(X = 0) = 1}")
bounds.multi <- optimize_effect_2(obj)

b2 <- graph_from_literal(Z1 -+ X, Ul -+ Z1, X -+ Y, Ur -+ X, Ur -+ Y)
V(b2)$leftside <- c(1, 0, 1, 0, 0)
V(b2)$latent <- c(0, 0, 1, 0, 1)
V(b2)$nvals <- c(2, 2, 2, 2, 2)
E(b2)$rlconnect <- c(0, 0, 0, 0, 0)
E(b2)$edge.monotone <- c(0, 0, 0, 0, 0)

## single instrument
obj2 <- analyze_graph(b2, constraints = NULL,
                      effectt = "p{Y(X = 1) = 1} - p{Y(X = 0) = 1}")
bounds.sing <- optimize_effect_2(obj2)

b3 <- graph_from_literal(Z3 -+ X, Ul -+ Z3, X -+ Y, Ur -+ X, Ur -+ Y)
V(b3)$leftside <- c(1, 0, 1, 0, 0)
V(b3)$latent <- c(0, 0, 1, 0, 1)
V(b3)$nvals <- c(4, 2, 2, 2, 2)
E(b3)$rlconnect <- c(0, 0, 0, 0, 0)
E(b3)$edge.monotone <- c(0, 0, 0, 0, 0)

## single four-level instrument
obj3 <- analyze_graph(b3, constraints = NULL,
                      effectt = "p{Y(X = 1) = 1} - p{Y(X = 0) = 1}")
bounds.quad <- optimize_effect_2(obj3)

## Joint probability of each row (Z1, Z2, X, Y) of `df` under a probit model
## with two binary latent variables, marginalised over those latents.
##   df    data frame with 0/1 columns Z1, Z2, X and Y
##   alpha numeric vector of 12 probit coefficients
##   pUr   weight given to the latent value entering the X and Y models
##   pUl   weight given to the latent value entering the Z1 and Z2 models
## Returns one probability per row of `df`.
joint <- function(df, alpha, pUr, pUl) {

  Z1 <- df$Z1
  Z2 <- df$Z2
  X <- df$X
  Y <- df$Y

  ## probability of the observed cells for fixed latent values ur and ul;
  ## each factor is a Bernoulli likelihood p^v * (1 - p)^(1 - v)
  cond_joint <- function(ur, ul) {
    p.z1 <- pnorm(alpha[1] + alpha[2] * ul)
    p.z2 <- pnorm(alpha[3] + alpha[4] * ul + alpha[5] * Z1)
    p.x <- pnorm(alpha[6] + alpha[7] * Z1 + alpha[8] * Z2 + alpha[9] * ur)
    p.y <- pnorm(alpha[10] + alpha[11] * X + alpha[12] * ur)

    (p.z1 ^ Z1 * (1 - p.z1) ^ (1 - Z1)) *
      (p.z2 ^ Z2 * (1 - p.z2) ^ (1 - Z2)) *
      (p.x ^ X * (1 - p.x) ^ (1 - X)) *
      p.y ^ Y * (1 - p.y) ^ (1 - Y)
  }

  ## mixture over the four combinations of the two latent variables
  pUr * pUl * cond_joint(1, 1) +
    pUr * (1 - pUl) * cond_joint(1, 0) +
    (1 - pUr) * pUl * cond_joint(0, 1) +
    (1 - pUr) * (1 - pUl) * cond_joint(0, 0)

}


## get conditional probabilities
## key = XY_Z1Z2
##   p.vals data frame with columns Z1, Z2, Z3, X, Y and Prob (joint
##          probability of each row)
## Returns a list with three named lists of conditional probabilities of
## (X, Y): `multi` given (Z1, Z2), `sing` given Z1 and `quad` given Z3.
get_cond_probs <- function(p.vals) {

  ## conditional on Z1 and Z2
  z1z2.joint <- unique(p.vals[, c("Z1", "Z2")])
  for (j in seq_len(nrow(z1z2.joint))) {
    z1z2.joint$Prob.condz1z2[j] <-
      sum(subset(p.vals, Z1 == z1z2.joint[j, "Z1"] &
                   Z2 == z1z2.joint[j, "Z2"])$Prob)
  }

  p.vals.2 <- merge(p.vals, z1z2.joint, by = c("Z1", "Z2"), sort = FALSE)
  ## an exactly-zero joint probability maps to zero instead of dividing
  p.vals.2$Prob.cond.fin <- ifelse(p.vals.2$Prob == 0, 0.0,
                                   p.vals.2$Prob / p.vals.2$Prob.condz1z2)

  res <- as.list(p.vals.2$Prob.cond.fin)
  names(res) <- with(p.vals.2, paste0("p", X, Y, "_", Z1, Z2))

  ## conditional on Z1 only
  xyz1.joint <- unique(p.vals[, c("Z1", "X", "Y")])
  for (j in seq_len(nrow(xyz1.joint))) {
    xyz1.joint$Prob.xyz1[j] <-
      sum(subset(p.vals, Z1 == xyz1.joint$Z1[j] &
                   X == xyz1.joint$X[j] &
                   Y == xyz1.joint$Y[j])$Prob)
  }

  z1.marg0 <- sum(subset(xyz1.joint, Z1 == 0)$Prob.xyz1)
  z1.marg1 <- sum(subset(xyz1.joint, Z1 == 1)$Prob.xyz1)
  xyz1.joint$Prob.z1[xyz1.joint$Z1 == 0] <- z1.marg0
  xyz1.joint$Prob.z1[xyz1.joint$Z1 == 1] <- z1.marg1
  xyz1.joint$Prob.cond <- with(xyz1.joint, Prob.xyz1 / Prob.z1)

  res2 <- as.list(xyz1.joint$Prob.cond)
  names(res2) <- with(xyz1.joint, paste0("p", X, Y, "_", Z1))

  ## conditioning on Z3
  z3.joint <- unique(p.vals[, c("Z3"), drop = FALSE])
  for (j in seq_len(nrow(z3.joint))) {
    z3.joint$Prob.condz3[j] <-
      sum(subset(p.vals, Z3 == z3.joint[j, "Z3"])$Prob)
  }

  p.vals.3 <- merge(p.vals, z3.joint, by = c("Z3"), sort = FALSE)
  p.vals.3$Prob.cond.fin <- ifelse(p.vals.3$Prob == 0, 0.0,
                                   p.vals.3$Prob / p.vals.3$Prob.condz3)

  res3 <- as.list(p.vals.3$Prob.cond.fin)
  names(res3) <- with(p.vals.3, paste0("p", X, Y, "_", Z3))

  list(multi = res, sing = res2, quad = res3)

}

## simulate and compare the three sets of bounds
nsim <- 50000
f.multi <- interpret_bounds(bounds.multi$bounds, obj$parameters)
f.single <- interpret_bounds(bounds.sing$bounds, obj2$parameters)
f.quad <- interpret_bounds(bounds.quad$bounds, obj3$parameters)

result <- matrix(NA, ncol = 9, nrow = nsim)

set.seed(211129)
for (i in seq_len(nsim)) {

  alpha <- rnorm(12, sd = 2)
  pUr <- runif(1)
  pUl <- runif(1)

  p.vals.joint <- obj$p.vals
  p.vals.joint$Prob <- joint(p.vals.joint, alpha, pUr, pUl)
  ## recode the pair (Z1, Z2) as a single four-level instrument Z3
  p.vals.joint$Z3 <- with(p.vals.joint,
                          ifelse(Z1 == 0 & Z2 == 0, 0,
                                 ifelse(Z1 == 0 & Z2 == 1, 1,
                                        ifelse(Z1 == 1 & Z2 == 0, 2, 3))))

  ## skip draws with a zero cell probability; their row of `result` stays NA
  if (any(p.vals.joint$Prob == 0)) next

  condprobs <- get_cond_probs(p.vals.joint)

  bees <- do.call(f.multi, condprobs$multi)
  bees.sing <- do.call(f.single, condprobs$sing)
  bees.quad <- do.call(f.quad, condprobs$quad)

  result[i, ] <- unlist(c(sort(unlist(bees)), abs(bees[2] - bees[1]),
                          sort(unlist(bees.sing)),
                          abs(bees.sing[2] - bees.sing[1]),
                          sort(unlist(bees.quad)),
                          abs(bees.quad[2] - bees.quad[1])))

}

colnames(result) <- c("bound.lower", "bound.upper", "width.multi",
                      "bound.lower.single", "bound.upper.single",
                      "width.single",
                      "bound.lower.quad", "bound.upper.quad", "width.quad")
bounds.comparison <- as.data.frame(result)

#pdf("figsim.pdf", width = 8, height = 4.25, family = "serif")
old.par <- par(mfrow = c(1, 2))
plot(width.multi ~ width.single, data = bounds.comparison,
     pch = 20, cex = .3, xlim = c(0, 1), ylim = c(0, 1),
     xlab = "Single IV", ylab = "Two binary IV/Single 4-level IV",
     main = "Width of bounds intervals")
abline(0, 1, lty = 3)
plot(bound.lower.quad ~ bound.lower, data = bounds.comparison[1:100, ],
     pch = 20, cex = 1, xlim = c(-1, 1), ylim = c(-1, 1),
     xlab = "Two binary IV", ylab = "Single 4-level IV",
     main = "Bounds values")
points(bound.upper.quad ~ bound.upper, data = bounds.comparison[1:100, ],
       pch = 1, cex = 1)
legend("bottomright", pch = c(1, 20), legend = c("upper", "lower"))
## restore the graphical parameters that were in place before plotting
par(old.par)
#dev.off()

summary(bounds.comparison) # contains 467 NA's to avoid division by 0

# Verify that a single quad-level instrument yields the same bounds as two
# linked binary ones. The comparison is elementwise (`&`, not the scalar `&&`)
# so that every simulated row is checked, and uses a numerical tolerance
# rather than exact equality; skipped (NA) rows are ignored.
tol <- 1e-12
with(bounds.comparison,
     all(abs(bound.lower - bound.lower.quad) < tol &
           abs(bound.upper - bound.upper.quad) < tol,
         na.rm = TRUE))
```

## measurement error in the outcome

```{r}
b <- graph_from_literal(Ul -+ X -+ Y -+ Y2, Ur -+ Y, Ur -+ Y2)
V(b)$leftside <- c(1, 1, 0, 0, 0)
V(b)$latent <- c(1, 0, 1, 0, 1)
V(b)$nvals <- c(2, 2, 2, 2, 2)
E(b)$rlconnect <- c(0, 0, 0, 0, 0)
E(b)$edge.monotone <- c(0, 0, 0, 0, 0)

obj <- analyze_graph(b, constraints = "Y2(Y = 1) >= Y2(Y = 0)",
                     effectt = "p{Y(X = 1) = 1} - p{Y(X = 0) = 1}")
optimize_effect_2(obj)
```