# Grabbing Cambridge air photos
from bs4 import BeautifulSoup
import csv
import requests
# Step 1: collect the lightbox image links from every gallery page and write
# them to output.txt, one link per line.

# Build the list of gallery page URLs to visit.
# NOTE(review): the leading '' looks like a placeholder for the site's base
# URL -- with it empty, requests.get() will reject the URL. Confirm and fill in.
pages = []
for i in range(1, 2):
    url = '' + str(i) + '.html'
    # The URL must be queued here; otherwise the fetch loop below has nothing
    # to iterate over and output.txt stays empty.
    pages.append(url)

# The context manager guarantees output.txt is flushed and closed before any
# later code reads it back.
with open("output.txt", "w") as file:
    for item in pages:
        page = requests.get(item)
        soup = BeautifulSoup(page.content, "html.parser")
        divs = soup.find_all(
            'div', attrs={"class": "cucapgallery naturalwidth compressed"}
        )
        for div in divs:
            for link in div.find_all('a', attrs={"class": "lightbox"}):
                fulllink = link.get('href')
                if not fulllink:
                    # Anchor without an href: nothing to record, and writing
                    # None would raise TypeError.
                    continue
                # NOTE(review): the empty first element is kept from the
                # original; presumably a placeholder for a URL prefix.
                file.writelines(["", fulllink, "\n"])
import csv
import requests
import re
# Step 2: read the links back from output.txt and save each one that answers
# with HTTP 200 as "<link>.jpg".

img = []  # not used by the code visible here; kept in case later code reads it

# newline='' is the csv module's recommended way to open files for csv.reader.
with open('output.txt', newline='') as csvfile:
    csvrows = csv.reader(csvfile, delimiter=',', quotechar='"')
    for row in csvrows:
        if not row:
            # Blank lines produce an empty row; row[0] would raise IndexError.
            continue
        url = row[0]
        # The output file name is the link itself with double quotes removed.
        # NOTE(review): if the link contains path separators, the target
        # directory must already exist -- confirm this is intended.
        filename = re.sub('[""]', '', url)
        result = requests.get(url, stream=True)
        if result.status_code == 200:
            # Response.content reads the full (streamed) body as bytes.
            image = result.content
            # Close the image file deterministically instead of relying on
            # garbage collection.
            with open(filename + ".jpg", "wb") as out:
                out.write(image)
