# jmcastagnetto/parse_data.R

## parse_data.R
library(tidyverse)
library(rvest)
library(V8)

# Scrape the GreatSchools "table" view for New York, extract the `gon`
# JavaScript object embedded in the page head, and save its school records
# to "schools.rds" in the working directory.
url <- "https://www.greatschools.org/new-york/new-york/schools/?view=table"
# XPath of the first <script> element under <head>.
xpath <- "/html/head/script[1]"

ctx <- v8()

# Rewrite the first `window.gon` to a plain `gon` so the evaluated statement
# assigns to a global; presumably needed because the V8 context does not
# define `window` -- confirm against the page source.
txt <- read_html(url) %>%
  html_elements(xpath = xpath) %>%
  html_text(trim = TRUE) %>%
  str_replace(fixed("window.gon"), "gon")

# Fail early with a clear message if the page layout changed.
if (length(txt) != 1L || is.na(txt)) {
  stop(
    "Expected exactly one <script> node at '", xpath, "', found ",
    length(txt), ".",
    call. = FALSE
  )
}

# Split the script text into lines in memory; no temporary file is needed
# (and therefore none is left behind on disk).
txt2 <- str_split(txt, "\\r?\\n")[[1]]

# The statement that is evaluated is the second line of the script.
if (length(txt2) < 2L) {
  stop(
    "The script has fewer than two lines; cannot find the `gon` statement.",
    call. = FALSE
  )
}

ctx$eval(txt2[2])
tmp <- ctx$get("gon")

# Guard against silently saving an empty result when the expected
# `search$schools` entry is missing.
schools <- tmp$search$schools
if (is.null(schools)) {
  stop("`gon$search$schools` was not found in the page data.", call. = FALSE)
}

df <- as_tibble(schools)
saveRDS(df, file = "schools.rds")
	library(tidyverse)
	library(rvest)
	library(V8)

	# NOTE(review): this tab-indented section repeats the same scrape-and-save
	# steps that appear earlier in the file, so the page is fetched twice and
	# "schools.rds" is overwritten -- confirm whether both copies are intended.
	#
	# Scrape the GreatSchools "table" view for New York, extract the `gon`
	# JavaScript object embedded in the page head, and save its school records
	# to "schools.rds" in the working directory.
	url <- "https://www.greatschools.org/new-york/new-york/schools/?view=table"
	# XPath of the first <script> element under <head>.
	xpath <- "/html/head/script[1]"

	ctx <- v8()

	# Rewrite the first `window.gon` to a plain `gon` so the evaluated statement
	# assigns to a global; presumably needed because the V8 context does not
	# define `window` -- confirm against the page source.
	txt <- read_html(url) %>%
	  html_elements(xpath = xpath) %>%
	  html_text(trim = TRUE) %>%
	  str_replace(fixed("window.gon"), "gon")

	# Fail early with a clear message if the page layout changed.
	if (length(txt) != 1L || is.na(txt)) {
	  stop(
	    "Expected exactly one <script> node at '", xpath, "', found ",
	    length(txt), ".",
	    call. = FALSE
	  )
	}

	# Split the script text into lines in memory; no temporary file is needed
	# (and therefore none is left behind on disk).
	txt2 <- str_split(txt, "\\r?\\n")[[1]]

	# The statement that is evaluated is the second line of the script.
	if (length(txt2) < 2L) {
	  stop(
	    "The script has fewer than two lines; cannot find the `gon` statement.",
	    call. = FALSE
	  )
	}

	ctx$eval(txt2[2])
	tmp <- ctx$get("gon")

	# Guard against silently saving an empty result when the expected
	# `search$schools` entry is missing.
	schools <- tmp$search$schools
	if (is.null(schools)) {
	  stop("`gon$search$schools` was not found in the page data.", call. = FALSE)
	}

	df <- as_tibble(schools)
	saveRDS(df, file = "schools.rds")