# skagedal/swepubscraper.py

## swepubscraper.py
from urllib.request import urlopen

# Download the SwePub hit list from the Libris xsearch service page by page,
# saving each raw JSON response to "<start offset>.json" in the current
# working directory.

# Number of records requested per page; also the step between start offsets.
PAGE_SIZE = 200

# Query URL without the trailing start offset, which is appended per request.
BASE_URL = (
    'http://libris.kb.se/xsearch?d=swepub&hitlist&q=l%C3%A4ros%C3%A4te%3agu'
    '&f=ext&spell=true&hist=true&n=' + str(PAGE_SIZE) + '&format=json&start='
)

# Start offset of the next page to request; the first request uses 1.
counter = 1

while True:
    url = BASE_URL + str(counter)
    print("Fetching: " + url)

    # Close the HTTP response as soon as the payload has been read so that
    # connections do not pile up over a long run.
    with urlopen(url) as response:
        data = response.read()

    # A response without any "identifier" key is treated as the end of the
    # result set (presumably every returned record carries one -- confirm
    # against the xsearch response format).
    if b'"identifier"' not in data:
        print("No more records!")
        break

    # Binary mode: the payload is stored exactly as received, undecoded.
    with open(str(counter) + ".json", "wb") as outputfile:
        print("Writing file...")
        outputfile.write(data)

    counter += PAGE_SIZE