# lindsaycarbonell/scraper.py

## scraper.py
import requests
import http.cookiejar, urllib.request
import pandas as pd
import webbrowser
from bs4 import BeautifulSoup

# Fetch the results page, locate the download link inside the `t17CVS` div,
# and save whatever that link returns to ``file.xls`` in the working directory.

# NOTE(review): the long number in the `p=` argument looks like a session
# token and may go stale -- confirm before relying on this exact URL.
url = "http://apps.schools.nc.gov/ords/f?p=1:220:1214343525970901::NO::P220_SELECTLEA:920"

# A timeout keeps the script from hanging forever on an unresponsive server,
# and raise_for_status() stops us from parsing an HTTP error page as results.
response = requests.get(url, timeout=30)
response.raise_for_status()
html = response.content

soup = BeautifulSoup(html, "html.parser")

# find() returns None when the div is absent; fail with a readable message
# instead of an AttributeError/TypeError on None.
download_div = soup.find("div", attrs={'class': 't17CVS'})
anchor = download_div.a if download_div is not None else None
if anchor is None or not anchor.get('href'):
    raise SystemExit("download link (div.t17CVS > a[href]) not found in " + url)

link_param = anchor['href']
link_to_click = "http://apps.schools.nc.gov/ords/" + link_param

# The opener carries a cookie jar so cookies set while following the download
# link (e.g. across redirects) are sent back on subsequent hops.
cj = http.cookiejar.CookieJar()
opener = urllib.request.build_opener(urllib.request.HTTPCookieProcessor(cj))

# Open the response first: if the request fails, file.xls is never created or
# truncated. Both handles are closed even if reading or writing raises.
with opener.open(link_to_click, timeout=30) as res, open("file.xls", "wb") as f:
    f.write(res.read())