dsparks · December 18, 2012 22:31 · stapial · Mar 7, 2018 · ksorby · Mar 12, 2018
diff --git a/coefficent_plot_walkthrough.R b/coefficent_plot_walkthrough.R
 # Coefficient-plot walkthrough: fit several linear models that share a
 # dependent variable, collect their estimates and standard errors, and draw
 # them side by side with 90% and 95% confidence intervals using ggplot2.

 doInstall <- TRUE  # Set to FALSE to skip the installation step entirely
 toInstall <- c("ggplot2")
 if (doInstall) {
   # Only fetch packages that are not already available, so re-running the
   # script does not reinstall (or need network access for) what is present.
   isInstalled <- vapply(toInstall, requireNamespace, logical(1),
                         quietly = TRUE)
   if (!all(isInstalled)) {
     install.packages(toInstall[!isInstalled],
                      repos = "http://cran.us.r-project.org")
   }
 }
 invisible(lapply(toInstall, library, character.only = TRUE))

 ANES <- read.csv("http://www.oberlin.edu/faculty/cdesante/assets/downloads/ANES.csv")
 # Limit to just 2008 respondents and remove some non-helpful variables
 # (columns 1, 11 and 17). which() skips rows whose year is NA; a bare
 # logical index would turn each of them into a row made entirely of NAs.
 ANES <- ANES[which(ANES$year == 2008), -c(1, 11, 17)]
 head(ANES)

 # Fit several models with the same DV:
 model1 <- lm(pid7 ~ ideo7 + female + age + south, data = ANES)
 model2 <- lm(pid7 ~ ideo7 + female + age + female:age, data = ANES)
 model3 <- lm(pid7 ~ ideo7, data = ANES)  # These are just arbitrary examples

 # Put a fitted model's estimates into a data.frame with one row per term.
 #   model:     a fitted model whose summary() has a coefficient table with
 #              "Estimate" and "Std. Error" columns (as lm fits do).
 #   modelName: label stored in the modelName column for every row.
 # Returns a data.frame with columns Variable, Coefficient, SE, modelName.
 buildModelFrame <- function(model, modelName) {
   # Summarise once and use the full accessor rather than relying on `$coef`
   # partially matching the `coefficients` component.
   coefTable <- coef(summary(model))
   data.frame(Variable = rownames(coefTable),
              Coefficient = coefTable[, "Estimate"],
              SE = coefTable[, "Std. Error"],
              modelName = modelName)
 }

 # Put model estimates into temporary data.frames:
 model1Frame <- buildModelFrame(model1, "South Indicator")
 model2Frame <- buildModelFrame(model2, "Age Interaction")
 model3Frame <- buildModelFrame(model3, "Univariate")
 # Combine these data.frames (rbind already returns a data.frame)
 allModelFrame <- rbind(model1Frame, model2Frame, model3Frame)  # etc.

 # Specify the width of your confidence intervals
 interval1 <- -qnorm((1 - 0.9) / 2)  # 90% multiplier
 interval2 <- -qnorm((1 - 0.95) / 2)  # 95% multiplier

 # Plot: one colour per model, dashed reference line at zero, a thick line
 # for the 90% interval and a thinner point-range for the 95% interval.
 zp1 <- ggplot(allModelFrame, aes(colour = modelName)) +
   geom_hline(yintercept = 0, colour = gray(1/2), lty = 2) +
   geom_linerange(aes(x = Variable,
                      ymin = Coefficient - SE * interval1,
                      ymax = Coefficient + SE * interval1),
                  lwd = 1, position = position_dodge(width = 1/2)) +
   geom_pointrange(aes(x = Variable, y = Coefficient,
                       ymin = Coefficient - SE * interval2,
                       ymax = Coefficient + SE * interval2),
                   lwd = 1/2, position = position_dodge(width = 1/2),
                   shape = 21, fill = "WHITE") +
   coord_flip() +  # terms on the vertical axis, estimates on the horizontal
   theme_bw() +
   ggtitle("Comparing several models")
 print(zp1)  # The trick to these is position_dodge().
	# Coefficient-plot walkthrough: fit several linear models that share a
	# dependent variable, collect their estimates and standard errors, and draw
	# them side by side with 90% and 95% confidence intervals using ggplot2.

	doInstall <- TRUE  # Set to FALSE to skip the installation step entirely
	toInstall <- c("ggplot2")
	if (doInstall) {
	  # Only fetch packages that are not already available, so re-running the
	  # script does not reinstall (or need network access for) what is present.
	  isInstalled <- vapply(toInstall, requireNamespace, logical(1),
	                        quietly = TRUE)
	  if (!all(isInstalled)) {
	    install.packages(toInstall[!isInstalled],
	                     repos = "http://cran.us.r-project.org")
	  }
	}
	invisible(lapply(toInstall, library, character.only = TRUE))

	ANES <- read.csv("http://www.oberlin.edu/faculty/cdesante/assets/downloads/ANES.csv")
	# Limit to just 2008 respondents and remove some non-helpful variables
	# (columns 1, 11 and 17). which() skips rows whose year is NA; a bare
	# logical index would turn each of them into a row made entirely of NAs.
	ANES <- ANES[which(ANES$year == 2008), -c(1, 11, 17)]
	head(ANES)

	# Fit several models with the same DV:
	model1 <- lm(pid7 ~ ideo7 + female + age + south, data = ANES)
	model2 <- lm(pid7 ~ ideo7 + female + age + female:age, data = ANES)
	model3 <- lm(pid7 ~ ideo7, data = ANES)  # These are just arbitrary examples

	# Put a fitted model's estimates into a data.frame with one row per term.
	#   model:     a fitted model whose summary() has a coefficient table with
	#              "Estimate" and "Std. Error" columns (as lm fits do).
	#   modelName: label stored in the modelName column for every row.
	# Returns a data.frame with columns Variable, Coefficient, SE, modelName.
	buildModelFrame <- function(model, modelName) {
	  # Summarise once and use the full accessor rather than relying on `$coef`
	  # partially matching the `coefficients` component.
	  coefTable <- coef(summary(model))
	  data.frame(Variable = rownames(coefTable),
	             Coefficient = coefTable[, "Estimate"],
	             SE = coefTable[, "Std. Error"],
	             modelName = modelName)
	}

	# Put model estimates into temporary data.frames:
	model1Frame <- buildModelFrame(model1, "South Indicator")
	model2Frame <- buildModelFrame(model2, "Age Interaction")
	model3Frame <- buildModelFrame(model3, "Univariate")
	# Combine these data.frames (rbind already returns a data.frame)
	allModelFrame <- rbind(model1Frame, model2Frame, model3Frame)  # etc.

	# Specify the width of your confidence intervals
	interval1 <- -qnorm((1 - 0.9) / 2)  # 90% multiplier
	interval2 <- -qnorm((1 - 0.95) / 2)  # 95% multiplier

	# Plot: one colour per model, dashed reference line at zero, a thick line
	# for the 90% interval and a thinner point-range for the 95% interval.
	zp1 <- ggplot(allModelFrame, aes(colour = modelName)) +
	  geom_hline(yintercept = 0, colour = gray(1/2), lty = 2) +
	  geom_linerange(aes(x = Variable,
	                     ymin = Coefficient - SE * interval1,
	                     ymax = Coefficient + SE * interval1),
	                 lwd = 1, position = position_dodge(width = 1/2)) +
	  geom_pointrange(aes(x = Variable, y = Coefficient,
	                      ymin = Coefficient - SE * interval2,
	                      ymax = Coefficient + SE * interval2),
	                  lwd = 1/2, position = position_dodge(width = 1/2),
	                  shape = 21, fill = "WHITE") +
	  coord_flip() +  # terms on the vertical axis, estimates on the horizontal
	  theme_bw() +
	  ggtitle("Comparing several models")
	print(zp1)  # The trick to these is position_dodge().