rentrop · December 3, 2023 06:01 · rentrop · Sep 26, 2015 · Matherion · Mar 17, 2016
diff --git a/gg_qq.r b/gg_qq.r
 #' Q-Q plot with a pointwise confidence band, drawn with ggplot2
 #'
 #' Plots the ordered values of `x` against the theoretical quantiles of the
 #' chosen distribution, adds a reference line and a confidence ribbon around
 #' it, and labels the points that fall outside the ribbon.
 #'
 #' @param x Numeric vector. Missing values are removed before plotting.
 #' @param distribution Distribution suffix; the functions `q<distribution>`
 #'   and `d<distribution>` (e.g. `qnorm`/`dnorm`) must exist.
 #' @param ... Distribution parameters, forwarded to both the quantile and
 #'   the density function.
 #' @param line.estimate `NULL` to draw the line through the first and third
 #'   quartiles, or a model-fitting function that is called as
 #'   `line.estimate(ord.x ~ z, data = df)` and whose `coef()` yields
 #'   intercept and slope (for example `lm`).
 #' @param conf Confidence level of the ribbon.
 #' @param labels Point labels, one per element of `x`; only points outside
 #'   the ribbon are labelled. `NULL` disables labelling.
 #' @return Length-two numeric vector: intercept and slope of the reference
 #'   line. The plot is printed as a side effect.
 gg_qq <- function(x, distribution = "norm", ..., line.estimate = NULL,
                   conf = 0.95, labels = names(x)) {
   # Resolve the functions by name; same lookup scope as evaluating the name
   # in this frame, but without running arbitrary text through eval(parse()).
   q.function <- get(paste0("q", distribution), mode = "function")
   d.function <- get(paste0("d", distribution), mode = "function")

   # Evaluate `labels` before `x` is modified so labels supplied for the full
   # input stay aligned with the observations that survive NA removal.
   force(labels)
   keep <- !is.na(x)
   if (!is.null(labels) && length(labels) == length(x)) {
     labels <- labels[keep]
   }
   x <- x[keep]

   ord <- order(x)
   n <- length(x)
   P <- ppoints(n)
   df <- data.frame(ord.x = x[ord], z = q.function(P, ...))

   if (is.null(line.estimate)) {
     # Line through the first and third quartiles (as stats::qqline does).
     Q.x <- quantile(df$ord.x, c(0.25, 0.75))
     Q.z <- q.function(c(0.25, 0.75), ...)
     b <- diff(Q.x) / diff(Q.z)
     line.coef <- c(Q.x[1] - b * Q.z[1], b)
   } else {
     # The formula refers to columns of `df`, so the data must be passed on.
     line.coef <- coef(line.estimate(ord.x ~ z, data = df))
   }

   zz <- qnorm(1 - (1 - conf) / 2)
   # Standard error of an order statistic; the density has to use the same
   # distribution parameters as the theoretical quantiles.
   SE <- (line.coef[2] / d.function(df$z, ...)) * sqrt(P * (1 - P) / n)
   fit.value <- line.coef[1] + line.coef[2] * df$z
   df$upper <- fit.value + zz * SE
   df$lower <- fit.value - zz * SE

   if (!is.null(labels)) {
     outside <- df$ord.x > df$upper | df$ord.x < df$lower
     df$label <- ifelse(outside, as.character(labels)[ord], "")
   }

   p <- ggplot(df, aes(x = z, y = ord.x)) +
     geom_point() +
     geom_abline(intercept = line.coef[1], slope = line.coef[2]) +
     geom_ribbon(aes(ymin = lower, ymax = upper), alpha = 0.2)
   if (!is.null(labels)) {
     p <- p + geom_text(aes(label = label))
   }
   print(p)
   line.coef
 }
diff --git a/test.R b/test.R
 # Example: Q-Q plot of the studentized residuals of a log-log regression on
 # the Animals2 data from the robustbase package.
 library(ggplot2)  # gg_qq() calls ggplot2 functions unqualified
 # data() loads the dataset into the workspace and returns only its *name*,
 # so the result must not be assigned back to `Animals2`.
 data(Animals2, package = "robustbase")
 # Passing `data =` keeps the row names on the residuals, which gg_qq() uses
 # as point labels.
 mod.lm <- lm(log(brain) ~ log(body), data = Animals2)
 x <- rstudent(mod.lm)
 gg_qq(x)

 # See https://stackoverflow.com/questions/4357031/qqnorm-and-qqline-in-ggplot2/27191036#27191036
	#' Q-Q plot with a pointwise confidence band, drawn with ggplot2
	#'
	#' Plots the ordered values of `x` against the theoretical quantiles of the
	#' chosen distribution, adds a reference line and a confidence ribbon around
	#' it, and labels the points that fall outside the ribbon.
	#'
	#' @param x Numeric vector. Missing values are removed before plotting.
	#' @param distribution Distribution suffix; the functions `q<distribution>`
	#'   and `d<distribution>` (e.g. `qnorm`/`dnorm`) must exist.
	#' @param ... Distribution parameters, forwarded to both the quantile and
	#'   the density function.
	#' @param line.estimate `NULL` to draw the line through the first and third
	#'   quartiles, or a model-fitting function that is called as
	#'   `line.estimate(ord.x ~ z, data = df)` and whose `coef()` yields
	#'   intercept and slope (for example `lm`).
	#' @param conf Confidence level of the ribbon.
	#' @param labels Point labels, one per element of `x`; only points outside
	#'   the ribbon are labelled. `NULL` disables labelling.
	#' @return Length-two numeric vector: intercept and slope of the reference
	#'   line. The plot is printed as a side effect.
	gg_qq <- function(x, distribution = "norm", ..., line.estimate = NULL,
	                  conf = 0.95, labels = names(x)) {
	  # Resolve the functions by name; same lookup scope as evaluating the name
	  # in this frame, but without running arbitrary text through eval(parse()).
	  q.function <- get(paste0("q", distribution), mode = "function")
	  d.function <- get(paste0("d", distribution), mode = "function")

	  # Evaluate `labels` before `x` is modified so labels supplied for the full
	  # input stay aligned with the observations that survive NA removal.
	  force(labels)
	  keep <- !is.na(x)
	  if (!is.null(labels) && length(labels) == length(x)) {
	    labels <- labels[keep]
	  }
	  x <- x[keep]

	  ord <- order(x)
	  n <- length(x)
	  P <- ppoints(n)
	  df <- data.frame(ord.x = x[ord], z = q.function(P, ...))

	  if (is.null(line.estimate)) {
	    # Line through the first and third quartiles (as stats::qqline does).
	    Q.x <- quantile(df$ord.x, c(0.25, 0.75))
	    Q.z <- q.function(c(0.25, 0.75), ...)
	    b <- diff(Q.x) / diff(Q.z)
	    line.coef <- c(Q.x[1] - b * Q.z[1], b)
	  } else {
	    # The formula refers to columns of `df`, so the data must be passed on.
	    line.coef <- coef(line.estimate(ord.x ~ z, data = df))
	  }

	  zz <- qnorm(1 - (1 - conf) / 2)
	  # Standard error of an order statistic; the density has to use the same
	  # distribution parameters as the theoretical quantiles.
	  SE <- (line.coef[2] / d.function(df$z, ...)) * sqrt(P * (1 - P) / n)
	  fit.value <- line.coef[1] + line.coef[2] * df$z
	  df$upper <- fit.value + zz * SE
	  df$lower <- fit.value - zz * SE

	  if (!is.null(labels)) {
	    outside <- df$ord.x > df$upper | df$ord.x < df$lower
	    df$label <- ifelse(outside, as.character(labels)[ord], "")
	  }

	  p <- ggplot(df, aes(x = z, y = ord.x)) +
	    geom_point() +
	    geom_abline(intercept = line.coef[1], slope = line.coef[2]) +
	    geom_ribbon(aes(ymin = lower, ymax = upper), alpha = 0.2)
	  if (!is.null(labels)) {
	    p <- p + geom_text(aes(label = label))
	  }
	  print(p)
	  line.coef
	}
	# Example: Q-Q plot of the studentized residuals of a log-log regression on
	# the Animals2 data from the robustbase package.
	library(ggplot2)  # gg_qq() calls ggplot2 functions unqualified
	# data() loads the dataset into the workspace and returns only its *name*,
	# so the result must not be assigned back to `Animals2`.
	data(Animals2, package = "robustbase")
	# Passing `data =` keeps the row names on the residuals, which gg_qq() uses
	# as point labels.
	mod.lm <- lm(log(brain) ~ log(body), data = Animals2)
	x <- rstudent(mod.lm)
	gg_qq(x)

	# See https://stackoverflow.com/questions/4357031/qqnorm-and-qqline-in-ggplot2/27191036#27191036