# fmoliveira/webscraping_nyc_mta.py

## webscraping_nyc_mta.py
# Import libraries
import requests
import urllib.request
import time
from bs4 import BeautifulSoup

# Set the URL you want to webscrape from
url = 'http://web.mta.info/developers/turnstile.html'

# Connect to the URL. An explicit timeout is passed because requests waits
# indefinitely by default, which would hang the script if the server stalls.
response = requests.get(url, timeout=30)

# Stop on an HTTP error status (4xx/5xx) instead of parsing an error page
# as though it were the turnstile listing.
response.raise_for_status()

# Parse HTML and save to BeautifulSoup object
soup = BeautifulSoup(response.text, "html.parser")

# To download the whole data set, loop through the 'a' tags (links) of the
# page, starting at the 37th one (index 36).
# NOTE(review): the leading 36 anchors are presumably navigation/boilerplate
# links - confirm against the current page layout.
FIRST_DATA_LINK_INDEX = 36

# Collect the anchors once; re-querying the soup on every iteration repeats
# the same tree walk for no benefit.
all_a_tags = soup.find_all('a')

# Slicing stops at the last anchor, so the loop can no longer index one past
# the end of the list (the previous range(..., len + 1) raised IndexError).
for one_a_tag in all_a_tags[FIRST_DATA_LINK_INDEX:]:
    link = one_a_tag.get('href')
    if not link:
        # Anchor without an href attribute: nothing to download.
        continue

    marker_pos = link.find('/turnstile_')
    if marker_pos == -1:
        # Not a turnstile data file. Without this guard the whole link would
        # be used as the local path, which may point outside the working
        # directory or into a directory that does not exist.
        continue

    download_url = 'http://web.mta.info/developers/' + link
    # Local file name is everything after the slash preceding 'turnstile_'.
    local_path = './' + link[marker_pos + 1:]
    urllib.request.urlretrieve(download_url, local_path)
    time.sleep(1)  # pause for a second between downloads