Kieran R Campbell kieranrcampbell

Researcher, statistical machine learning for genomics

kieranrcampbell / rounding_in_R.R

Created January 2, 2018 23:06

	#' Round numeric values and render them with a fixed number of decimals
	#'
	#' Each helper rounds the numeric input `x` with `round()` and then passes
	#' the result to `format()` with `nsmall` set to the same number of digits,
	#' so trailing zeros are kept (e.g. 2 becomes "2.00").
	#'
	#' @param x Numeric vector to round.
	#' @param n Number of decimal places (`roundn` only; defaults to 2).
	#' @return Character vector as produced by `format()`.
	round1 <- function(x) {
	  rounded <- round(x, digits = 1)
	  format(rounded, nsmall = 1)
	}
	round2 <- function(x) {
	  rounded <- round(x, digits = 2)
	  format(rounded, nsmall = 2)
	}
	roundn <- function(x, n = 2) {
	  rounded <- round(x, digits = n)
	  format(rounded, nsmall = n)
	}

kieranrcampbell / convert_ensembl_gene_id_to_symbols.R

Created February 16, 2018 21:49

	# Map Ensembl gene IDs to HGNC symbols through the Ensembl BioMart service.
	# `ensembl_gene_ids` must already exist in the calling environment
	# (presumably a character vector of Ensembl gene IDs -- confirm with caller).
	library(biomaRt)
	library(dplyr) # supplies %>% and as_tibble(); biomaRt attaches neither

	ensembl <- useMart("ensembl")
	ensembl <- useDataset("hsapiens_gene_ensembl", mart = ensembl)

	# as_tibble() replaces the deprecated as_data_frame() alias.
	bm <- getBM(
	  attributes = c("ensembl_gene_id", "hgnc_symbol"),
	  filters = "ensembl_gene_id",
	  values = ensembl_gene_ids,
	  mart = ensembl
	) %>%
	  as_tibble()

kieranrcampbell / voom_de.R

Created March 20, 2018 22:40

Example differential expression analysis with limma-voom

	# Example limma-voom setup. `sce_de` must already exist in the calling
	# environment (presumably a SingleCellExperiment with a `dbz_cluster_str`
	# column in its colData -- confirm against your data).
	library(limma)
	library(edgeR) # DGEList() and calcNormFactors() are edgeR functions, not limma
	library(tidyverse)

	# Wrap the count matrix in a DGEList and compute normalization factors
	dge <- DGEList(counts(sce_de))
	dge <- calcNormFactors(dge)

	# Your design matrix here
	design <- model.matrix(~ (dbz_cluster_str == "Unknown"), colData(sce_de))

	# plot = TRUE also requests voom's diagnostic plot
	v <- voom(dge, design, plot = TRUE)

kieranrcampbell / get rmarkdown to properly build

Created April 4, 2018 19:03

# Append RStudio's bundled pandoc directory to PATH (per the gist title, so that
# rmarkdown builds work). Quoted so the value is never field-split by strict
# POSIX shells when PATH contains whitespace.
export PATH="$PATH:/Applications/RStudio.app/Contents/MacOS/pandoc"

kieranrcampbell / pretty_cnv_heatmap.R

Created April 10, 2018 18:26

	#' Plot a CNV heatmap
	#' \code{cnv_data} must have the following columns:
	#'
	#' - start (start position of each region)
	#' - chr (chromosome)
	#' - single_cell_id (id of each cell)
	#' - clone (clone to which each cell is assigned)
	#' - copy_number (copy number of each clone in region)
	#'
	#' @export

kieranrcampbell / prioritize-dplyr.R

Created May 9, 2018 18:00

kieranrcampbell / source-hdf5.R

Created June 13, 2018 20:00

	#' Source an HDF5 file (ignoring all groups) where each
	#' entry in the HDF5 is read and assigned to a variable
	#' in the current environment
	#' @importFrom rhdf5 h5ls
	source_hdf5 <- function(filename, e) {
	ls <- h5ls(filename)
	vars <- ls$name
	for(var in vars) {
	assign(var, h5read(filename, var), envir = e)
	}

kieranrcampbell / sce-utils.R

Created July 26, 2018 19:48

	# Some common functions for manipulating Bioconductor SingleCellExperiment objects

	#' Return the corresponding ensembl gene id for a symbol in a given SCE
	#'
	#' @param symbol Gene symbol(s) to look up; every one must occur in
	#'   `rowData(sce)$Symbol`, otherwise `stopifnot()` raises an error.
	#' @param sce Object whose `rowData()` has a `Symbol` column and whose
	#'   `rownames()` hold the ids to return.
	#' @return The entries of `rownames(sce)` whose symbol matches, in row order.
	get_ensembl_id <- function(symbol, sce) {
	  symbols <- rowData(sce)$Symbol
	  stopifnot(all(symbol %in% symbols))
	  # %in% never yields NA, so rows with a missing Symbol are dropped instead of
	  # leaking NA entries into the result as `==` would; it also avoids silent
	  # recycling when several symbols are supplied.
	  rownames(sce)[symbols %in% symbol]
	}

	#' Prepare an SCE read using read10XUtils for SC3
	prepare_for_sc3 <- function(sce) {

kieranrcampbell / clustermap.R

Created September 26, 2018 22:09

	clusterMap <- function(sce1, sce2) {

	clusters1 <- sort(unique(sce1$cluster)) # get unique clusters
	clusters2 <- sort(unique(sce2$cluster))

	# Check this is gene (row) by cluster (cell) - if not needs transposed
	cluster_means_1 <- sapply(clusters1, function(x) {
	rowMeans(as.matrix(logcounts(sce1[,sce1$cluster == x]))
	}))

kieranrcampbell / get_ensembl_id.R

Created October 18, 2018 21:37

	#' Look up the row name(s) of an SCE that correspond to a gene symbol
	#'
	#' @param symbol Gene symbol(s) to look up in `rowData(sce)$Symbol`.
	#' @param sce Object whose `rowData()` has a `Symbol` column and whose
	#'   `rownames()` hold the ids to return.
	#' @return The entries of `rownames(sce)` whose symbol matches, in row order.
	#'   Stops with "Symbol not in SCE genes" if any requested symbol is absent.
	get_ensembl_id <- function(symbol, sce) {
	  symbols <- rowData(sce)$Symbol
	  # all() keeps the condition length-one even when several symbols are given
	  if (!all(symbol %in% symbols)) {
	    stop("Symbol not in SCE genes")
	  }
	  # %in% never yields NA, so rows with a missing Symbol cannot add NA entries
	  # to the result the way an `==` comparison would.
	  rownames(sce)[symbols %in% symbol]
	}