Dan Lewer danlewer

Public health researcher at Bradford Institute for Health Research and @UCL

danlewer / show_cols.R

Created June 1, 2025 19:28

Simple function to show a vector of colours in a plot device

	# Draw a vector of colours as a single row of equal-width swatches, in the
	# order given, on a fresh plot with no axes or labels.
	#
	# x: vector of colours, passed unchanged to the `col` argument of rect()
	#
	# Called for its side effect (drawing); returns NULL invisibly.
	show_cols <- function (x) {
	  n <- length(x)
	  # empty canvas, one unit of width per colour
	  plot(1, type = 'n', xlim = c(0, n), ylim = c(0, 1), axes = FALSE, xlab = NA, ylab = NA)
	  # seq_len() gives no swatch edges when n is 0, whereas 0:(n - 1) would count down to -1
	  left <- seq_len(n) - 1
	  if (n > 0) rect(left, 0, left + 1, 1, col = x)
	  invisible(NULL)
	}

danlewer / offsets_survival.R

Created November 20, 2024 15:08

	# Minimal simulated survival dataset for use in regression analysis.
	# Purpose: show that the effect of a risk factor on an outcome must be
	# estimated with an offset term, not by adjusting for follow-up duration.

	# number of simulated individuals
	n <- 100000

	# random binary exposure, 30% prevalence
	binary_exposure <- rbinom(n = n, size = 1, prob = 0.3)

	# simulate total observation duration, associated with binary exposure

danlewer / risks_odds.R

Created September 16, 2024 06:42

	# Convert a risk (probability) to odds: odds = risk / (1 - risk).
	# risk: numeric vector of risks; the result has one odds value per element.
	risk2odds <- function (risk) {
	  complement <- 1 - risk
	  risk / complement
	}
	# Convert odds to a risk (probability): risk = odds / (1 + odds).
	# odds: numeric vector of odds; the result has one risk value per element.
	# Infinite odds map to a risk of 1, so that odds2risk(risk2odds(1)) returns 1
	# rather than the NaN produced by Inf / Inf.
	odds2risk <- function (odds) {
	  risk <- odds / (1 + odds)
	  # !is.na() keeps NA/NaN inputs out of the index so they stay NA/NaN in the result
	  risk[!is.na(odds) & odds == Inf] <- 1
	  risk
	}
	# Convert an odds ratio to a risk ratio.
	# OR: odds ratio; p0: the risk that appears in the formula
	# RR = OR / ((1 - p0) + p0 * OR).
	or2rr <- function (OR, p0) {
	  denominator <- (1 - p0) + (p0 * OR)
	  OR / denominator
	}
	# Convert a risk ratio to an odds ratio.
	# RR: risk ratio; p0: the risk that appears in the formula
	# OR = RR * (1 - p0) / (1 - RR * p0).
	rr2or <- function(RR, p0) {
	  numerator <- RR * (1 - p0)
	  denominator <- 1 - RR * p0
	  numerator / denominator
	}

danlewer / roundup.R

Created August 20, 2024 12:45

Round up

danlewer / ris2csv.R

Last active July 30, 2024 10:45

Convert RIS to CSV (requires data.table)

	# Reads a RIS file and converts it into a 'wide' data.table
	# Where records have multiple entries for a field, eg. author or keyword, these are given numbered column names, eg. KW1, KW2 etc
	# Note if the field label already has a number, this will be maintained, eg. T1 (for title) becomes T11

	library(data.table)

	ris2csv <- function (file) { # 'file' is the ris file in your working directory, eg. 'myrisfile.ris'
	d <- readLines(file)
	d <- strsplit(d, " - ", fixed = T)
	d[sapply(d, length) == 0] <- 'NEW RECORD'

danlewer / standardised_cluster_means.R

Last active June 24, 2024 07:45

	library(lme4) # for ML/REML fitting of mixed models

	# ----------------------------------------------------------------------------------------------
	# simulate a clustered dataset with cluster-level outcome affected by an individual "confounder"
	# ----------------------------------------------------------------------------------------------

	# inputs
	# ------

	# sample size

danlewer / linear_interpolation.R

Last active April 12, 2024 07:35

	# linear interpolation of lines between x and y coordinates, with option to find specific intercepts
	# x must be positive monotonic, y does not need to be

	interpolate <- function (x, y, xIncrements = 0.01, findx = NULL, findy = NULL) {
	if (length(x) != length(y)) stop('length(x) does not equal length(y)')
	if (is.unsorted(x)) stop('x is not positive monotonic')
	dx <- diff(x)
	dy <- diff(y)
	xNotches <- round(dx / xIncrements, 0)
	yIncrements <- dy / xNotches

danlewer / kappa_vs_agreement.R

Created October 9, 2023 13:35

	# compare Cohen's kappa and % agreement
	# for two raters making a binary (yes/no) decision
	# assuming the same prevalence for both raters

	library(viridisLite)

	# Cohen's kappa from the observed agreement, for a binary decision where the
	# same prevalence is used for both raters.
	# Po: observed proportion of agreement
	# prevalence: proportion of 'yes' decisions, applied to both raters
	k <- function (Po, prevalence) {
	  # chance agreement: both say yes, or both say no
	  both_yes <- prevalence^2
	  both_no <- (1 - prevalence)^2
	  expected <- both_yes + both_no
	  (Po - expected) / (1 - expected)
	}

danlewer / extend_letters.R

Last active February 19, 2024 19:01

	# Here's a function that allows you to specify the number of letters you want (eg. 5 would be A, B, C, D, and E), the length of the code (eg. 3 would be AAA, AAB, AAC, etc), the number of results you want (NA for all of them), and a separating character (eg. '-' would give A-A-A, A-A-B, A-A-C.)
	#
	# nletters:   how many letters of the alphabet to use, starting from A
	# case:       'upper' for capital letters; any other value gives lower case
	# lengthCode: number of letters in each code
	# nResults:   number of codes to return, or NA for all of them
	# sep:        string placed between the letters of each code
	#
	# Returns a character vector of codes in which the last position varies fastest.

	letterCodes <- function(nletters, case = 'upper', lengthCode, nResults = NA, sep = '') {
	  f <- if (case == 'upper') LETTERS else letters
	  # seq_len() rather than 1:n, so that 0 letters selects nothing instead of f[c(1, 0)]
	  a <- expand.grid(rep(list(f[seq_len(nletters)]), lengthCode))
	  # reverse the columns so the last position varies fastest (AAA, AAB, ...);
	  # drop = FALSE keeps a data frame when lengthCode is 1, otherwise the single
	  # column collapses to a factor and do.call() below fails
	  a <- a[, rev(seq_len(ncol(a))), drop = FALSE]
	  a <- do.call("paste", c(a, sep = sep))
	  if (is.na(nResults)) a else a[seq_len(min(nResults, length(a)))]
	}

danlewer / table_specific_values.R

Last active January 29, 2023 21:48

	# return a table, but specify the values you want to be tabulated
	# works like base::table, but supplies only specified values, and returns 0 if none of those values exist in the vector
	#
	# vector: the vector to tabulate
	# values: the values to count; defaults to every unique value in `vector`
	#
	# Returns a numeric vector of counts, named by `values`.
	# NAs in `vector` are ignored, as base::table does by default; an NA in
	# `values` never matches anything and so gets a count of 0.

	tab_specific_values <- function(vector, values = unique(vector)) {
	  # one row per requested value, one column per element of `vector`
	  hits <- outer(values, vector, `==`)
	  # na.rm = TRUE: comparing with NA gives NA, which would otherwise turn every count into NA
	  counts <- rowSums(hits, na.rm = TRUE)
	  names(counts) <- values
	  counts
	}