# Comparing COVID-19 daily deaths to 2018 top ten causes of death
## 2018 top causes of death:
# Top ten causes of death in 2018: one row per cause with its rank-prefixed
# label and annual death count, plus the average number of deaths per day.
# The per-day value is what the plot draws as a horizontal reference line.
nchs_df <- tribble(
  ~cause, ~deaths_2018,
  "1. Heart disease", 655381,
  "2. Cancer", 599274,
  "3. Accidents", 167127,
  "4. Chronic lower respiratory diseases", 159486,
  "5. Stroke", 147810,
  "6. Alzheimer’s disease", 122019,
  "7. Diabetes", 84946,
  "8. Influenza and Pneumonia", 59120,
  "9. Nephritis, nephrotic syndrome and nephrosis", 51386,
  "10. Suicide", 48344
) %>%
  # 2018 is not a leap year, so the annual total is spread over 365 days.
  mutate(deaths_per_day = deaths_2018 / 365)
# NOTE(review): this statement is cut off in this view -- the vector of dates
# and the closing parentheses of c( and as.Date( are missing, so it does not
# parse as written. x_val is used further down as the x position of the cause
# labels; presumably one date per row of nchs_df is expected. Restore the
# dates before running.
nchs_df$x_val <- as.Date(c(
# Daily COVID-19 deaths and their 7-day rolling average, derived from a
# cumulative `deaths` column.
# Source: national file of the NYTimes covid-19-data repository, which has
# `date`, `cases` and cumulative `deaths` columns.
# NOTE(review): the path was an empty string, which read_csv() cannot open;
# confirm this URL is the intended input.
covid_df <- read_csv(
  "https://raw.githubusercontent.com/nytimes/covid-19-data/master/us.csv"
) %>%
  mutate(
    # First difference of the cumulative series; default = 0 makes the first
    # row's daily count equal to its cumulative count.
    daily_deaths = deaths - lag(deaths, default = 0),
    # Trailing 7-day mean; rows without a full 7-day window are filled with 0.
    rolling_avg = zoo::rollmean(
      daily_deaths,
      k = 7,
      fill = 0,
      align = "right"
    )
  )
# Daily COVID-19 deaths (grey bars) with the 7-day rolling average (red line),
# overlaid with one horizontal reference line and one label per 2018 cause of
# death taken from nchs_df.
p1 <- ggplot(
  data = covid_df,
  aes(x = date, y = daily_deaths)
) +
  geom_col(alpha = .3) +
  geom_line(aes(y = rolling_avg), color = "red", size = 1, alpha = .9) +
  # Reference levels: average deaths per day for each 2018 cause.
  geom_hline(
    data = nchs_df,
    aes(yintercept = deaths_per_day),
    alpha = .5
  ) +
  # Each label sits on its reference line at the date given by nchs_df$x_val.
  geom_label_repel(
    data = nchs_df,
    aes(
      x = x_val,
      y = deaths_per_day,
      label = cause
    ),
    force = 5
  ) +
  scale_y_continuous("Deaths per day", expand = c(0, .05)) +
  # The date_breaks / date_labels / expand arguments belong to a date scale;
  # without the scale_x_date( opener the `+` chain does not parse.
  scale_x_date(
    date_breaks = "1 month",
    date_labels = "%b",
    expand = c(0, 0)
  ) +
  mk_nytimes() +
  labs(
    title = "COVID-19 daily deaths vs 2018 Top Ten Causes of Death",
    subtitle = "Daily COVID-19 deaths (grey bars) and 7-day rolling average (red line). Reference lines are total 2018 deaths divided by 365.",
    caption = "COVID data: NYTimes. 2018 mortality data: NCHS. @mathewkiang"
  )
# NOTE(review): these look like the trailing arguments of a plot-saving call
# (e.g. ggsave()) whose opening line and closing parenthesis are not in this
# view; as written they do not parse. Restore the call before running.
width = 15,
height = 5,
scale = 1,
dpi = 300
