Created
April 11, 2024 04:40
-
-
Save RyanGreenup/e84bfc29cab7a0145727e56324d9a777 to your computer and use it in GitHub Desktop.
How to calculate P Values in R
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
library(Lock5Data) | |
library(tidyverse) | |
dplyr::glimpse(Lock5Data::NutritionStudy) | |
## Get X | |
table(X <- Lock5Data::NutritionStudy$Smoke) | |
## Encode as "Does this person Smoke | |
table(X <- (X == "Yes")) | |
## How many people smoke | |
mean(X) | |
mean(!X) | |
## Hyptothesis | |
## H_0: ρ = 0.2 | |
## H_a: ρ ≢ 0.2 | |
## H_α: ρ ≥ 0.2 | |
## H_α: ρ ≤ 0.2 | |
n <- length(X) | |
## We can take a sample of something with a population of ρ = 0.2 | |
s <- sample(c(rep(0, 8), rep(1, 2))) | |
## Or | |
s <- sample(c(0, 1), replace = TRUE, prob = c(0.8, 0.2)) | |
## Or | |
s <- mean(rbinom(length(X), 1, prob = 0.2)) | |
## Now we can take that and get the proportion in our sample | |
mean(s) | |
## This can then be wrapped into a function to perform one experiment | |
sample_02_pop <- function() { | |
mean(rbinom(length(X), 1, prob = 0.2)) | |
} | |
sample_02_pop() | |
## If we run that many times we can get a distribution of sample proportions | |
sample_proportions <- replicate(10^4, sample_02_pop()) | |
## The number of false positives we would see is the p-value because | |
## we assumed the null hypothesis | |
(pval <- mean(sample_proportions < mean(X))) | |
alpha <- 0.05 | |
if (pval < alpha) { | |
cat("Reject H0 at ", alpha) | |
} else { | |
cat("Insufficient evidence to reject H0 at ", alpha) | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment