Max Turgeon turgeonmaxime

## posthoc_power_analysis.R
# Simulation settings: B replicates, each based on a sample of size nsamp,
# with effect size mu and standard deviation sigma.
B <- 1000
nsamp <- 36
sigma <- 1
mu <- 0.1

# Theoretical power of the one-sided, one-sample t-test under these settings.
real_power <- power.t.test(
  n = nsamp,
  delta = mu,
  sd = sigma,
  type = "one.sample",
  alternative = "one.sided"
)[["power"]]

res <- replicate(B, {

## extract_annotations.R
library(stringr)

data_path <- "somefolder/planet04_rgbn_c9_r8.txt"

# Goal: pull the 9 and the 8 out of the file name
basename(data_path)

# Matching every run of digits returns more numbers than we want
str_extract_all(string = basename(data_path), pattern = "([0-9]+)")
# [[1]]

## sens_spec_sim.R
library(tidyverse)

# Inverse-logit (logistic) function: maps a real number t into [0, 1].
# Uses stats::plogis() because the direct formula exp(t) / (1 + exp(t))
# overflows to Inf / Inf = NaN once exp(t) is no longer representable
# (t greater than about 709).
expit <- function(t) stats::plogis(t)

n <- 1000000
prev_vec <- c(0.01, 0.05, 0.1, 0.25, 0.5)

results <- purrr::map_df(prev_vec, \(prev) {
    # Generate data
    dvec <- rbinom(n, prob = prev, size = 1)

## dotplot_ToothGrowth.R
library(tidyverse)
library(cowplot)

# Dot plot of tooth length with dots filled by dose; the fill legend is hidden.
# guides(fill = "none") is the supported spelling: passing FALSE to guides()
# is deprecated in current ggplot2 releases and triggers a warning.
gg1 <- ggplot(ToothGrowth, aes(x = len)) +
    geom_dotplot(aes(fill = as.factor(dose)),
                 binwidth = .5) +
    guides(fill = "none")

ToothGrowth2 <- arrange(ToothGrowth, len)
gg2 <- ggplot(ToothGrowth, aes(x = len, group = factor(dose))) +

## airport_delay.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                turgeonmaxime
                / airport_delay.md
            
            
              Created
              January 21, 2022 15:13
            
          
    library(tidyverse)
library(nycflights13)

# Mean departure delay for each destination (missing delays are ignored)
delay <- flights |> 
    group_by(dest) |> 
    summarize(means = mean(dep_delay, na.rm = TRUE))

# Attach each destination's mean delay to every flight with that destination
joined <- inner_join(delay, flights, by = "dest")

  
## cox_cb_poisson_comparison.R
#----
# Poisson vs casebase
# authors: Max Turgeon, Jesse Islam and Sahir Bhatnagar
# date: 10/1/2021
#----
set.seed(1952)

library(casebase)
library(cowplot)
library(Epi)

## t-test_outliers.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                turgeonmaxime
                / t-test_outliers.md
            
            
              Last active
              October 28, 2021 19:26
            
              
                Simulation study looking at the effect of outliers on the Type I error rate of the t-test
              
          
    B <- 1000      # number of replicates passed to replicate() below
n <- 20        # size of each rnorm() draw inside the replicate loop
sigma <- 10    # NOTE(review): presumably the SD of the contaminating (outlier) component -- confirm
p <- 0.9       # NOTE(review): presumably the mixing probability of the contaminated normal -- confirm
alpha <- 0.05  # NOTE(review): presumably the significance level of the t-test -- confirm

results <- replicate(B, {
    norm_vars1 <- rnorm(n)
 # Contaminated normal

  
## casebase_inset.R
library(casebase)
library(survival)
library(splines)
library(tidyverse)
library(cowplot)

# 1. Fit casebase with splines----
data("ERSPC")
ERSPC <- mutate(ERSPC, ScrArm = factor(ScrArm,
                                       levels = c(0,1),

## sk_vaccine.R
library(tidyverse)
library(RcppRoll)
library(rvest)


# Build the destination path inside the session's temporary directory.
# file.path() joins the components with "/" rather than pasting the
# separator by hand.
tmp_dir <- tempdir()
file_path <- file.path(tmp_dir, "vaccine_sk.csv")

# Download file

## covid_alberta_sask.R
library(tidyverse)
library(lubridate)
library(readr)

data_hr <- read_csv("https://raw.githubusercontent.com/ishaberry/Covid19Canada/master/timeseries_hr/cases_timeseries_hr.csv")

# Coerce string to dates and factor provinces
data_cum <- data_hr %>%
    filter(province %in% c("Alberta", "Saskatchewan")) %>%
    mutate(date_report = lubridate::dmy(date_report)) %>%
	mu <- 0.1
	sigma <- 1
	nsamp <- 36
	B <- 1000

	real_power <- power.t.test(delta = mu, sd = sigma, n = nsamp,
	alternative = "one.sided",
	type = "one.sample")$power

	res <- replicate(B, {
	library(stringr)

	data_path <- 'somefolder/planet04_rgbn_c9_r8.txt'

	# We want to extract 9 and 8
	basename(data_path)

	# Too many numbers
	str_extract_all(basename(data_path), "([0-9]+)")
	# [[1]]
	library(tidyverse)

	# Inverse-logit (logistic) function: maps a real number t into [0, 1].
	# Uses stats::plogis() because the direct formula exp(t) / (1 + exp(t))
	# overflows to Inf / Inf = NaN once exp(t) is no longer representable
	# (t greater than about 709).
	expit <- function(t) stats::plogis(t)

	n <- 1000000
	prev_vec <- c(0.01, 0.05, 0.1, 0.25, 0.5)

	results <- purrr::map_df(prev_vec, \(prev) {
	# Generate data
	dvec <- rbinom(n, prob = prev, size = 1)
	library(tidyverse)
	library(cowplot)

	# Dot plot of tooth length with dots filled by dose; the fill legend is hidden.
	# guides(fill = "none") is the supported spelling: passing FALSE to guides()
	# is deprecated in current ggplot2 releases and triggers a warning.
	gg1 <- ggplot(ToothGrowth, aes(x = len)) +
		geom_dotplot(aes(fill = as.factor(dose)),
		             binwidth = .5) +
		guides(fill = "none")

	ToothGrowth2 <- arrange(ToothGrowth, len)
	gg2 <- ggplot(ToothGrowth, aes(x = len, group = factor(dose))) +
	#----
	# Poisson vs casebase
	# authors: Max Turgeon, Jesse Islam and Sahir Bhatnagar
	# date: 10/1/2021
	#----
	set.seed(1952)

	library(casebase)
	library(cowplot)
	library(Epi)
	library(casebase)
	library(survival)
	library(splines)
	library(tidyverse)
	library(cowplot)

	# 1. Fit casebase with splines----
	data("ERSPC")
	ERSPC <- mutate(ERSPC, ScrArm = factor(ScrArm,
	levels = c(0,1),
	library(tidyverse)
	library(RcppRoll)
	library(rvest)


	# Create temporary directory
	tmp_dir <- tempdir()
	file_path <- paste0(tmp_dir, "/vaccine_sk.csv")

	# Download file
	library(tidyverse)
	library(lubridate)
	library(readr)

	data_hr <- read_csv("https://raw.githubusercontent.com/ishaberry/Covid19Canada/master/timeseries_hr/cases_timeseries_hr.csv")

	# Coerce string to dates and factor provinces
	data_cum <- data_hr %>%
	filter(province %in% c("Alberta", "Saskatchewan")) %>%
	mutate(date_report = lubridate::dmy(date_report)) %>%