# seandlg/imagedownloader.py

## imagedownloader.py
# begin by executing: "scrapy shell {link to flat}"
# scrapy exposes a response object that is used in the
# following few lines of code. Run the lines
# individually or simply execute the script by running
# "exec(open('imagedownloader.py').read())" in the
# scrapy shell.

import urllib.request

# Collect the ``data-src`` attribute of every <div> on the page.
# ``response`` is not defined in this file: it is the object the scrapy
# shell exposes (see the header comment), so this script only works when
# run inside that shell.
#
# The code is deliberately kept flat (no helper functions, no
# comprehensions referring to script-level names) because it is meant to
# be exec'd into the shell's namespace.
divs = response.css('div')
divsWithDataSrc = []

for div in divs:
	try:
		# Only this lookup can raise KeyError, so it is the only
		# statement kept inside the ``try``.
		dataSrc = div.attrib['data-src']
	except KeyError:
		# The div has no data-src attribute.
		print("Skipped a div")
	else:
		divsWithDataSrc.append(dataSrc)
		print("Added a div")

# Rewrite every data-src so that it starts with "http://": whatever
# precedes the first "//" is dropped and "http://" is put in its place.
# Splitting only once keeps URLs intact whose path itself contains "//".
downloadLinks = []
for src in divsWithDataSrc:
	if '//' not in src:
		# Without a "//" there is nothing to rebuild an absolute URL
		# from; skip the entry instead of failing with an IndexError.
		print(f"Skipped a data-src without '//': {src}")
		continue
	downloadLinks.append("http://" + src.split('//', 1)[1])

# Save each link into the current working directory as "<index>.jpg".
for i, link in enumerate(downloadLinks):
	try:
		urllib.request.urlretrieve(link, str(i) + ".jpg")
	except OSError as err:
		# urllib's URLError/HTTPError are OSError subclasses. Report the
		# failure and carry on so one bad link does not abort the rest.
		print(f"Failed to download image #{i}: {err}")
	else:
		print(f"Successfully downloaded image #{i}.")