# CrazyCoder/springer.py

## springer.py
# 1. Open https://link.springer.com/search/page/1?facet-content-type=%22Book%22&package=mat-covid19_textbooks
# 2. Click on the button on the top right of the table to save results into CSV file (SearchResults.csv)
# 3. Run: python springer.py SearchResults.csv
# Note: Python 3.6+ is required (the script uses f-strings); run `pip install requests` if the module is missing.

import sys
import csv
import requests
from pathlib import Path
from os import path
import re


def get_valid_filename(s):
    """Return ``s`` reduced to characters that are kept for file names.

    Leading and trailing whitespace is trimmed first. After that, every
    character that is not a hyphen, a space, a dot, or a Unicode word
    character (letter, digit, underscore) is dropped.
    """
    trimmed = s.strip()
    disallowed = re.compile(r'(?u)[^- \w.]')
    return disallowed.sub('', trimmed)


def download_file(ext):
    """Download the current book in the given format.

    Reads two module-level globals that the main loop sets before calling:
    ``row`` (the current CSV record) and ``file_name`` (the target path
    without extension). If ``<file_name>.<ext>`` already exists, nothing is
    fetched.

    Args:
        ext: Format / file extension to fetch, e.g. ``"pdf"`` or ``"epub"``.

    Returns:
        None. Progress and failures are printed to stdout. Ordinary errors
        are reported and swallowed so the caller can carry on, while
        ``KeyboardInterrupt`` and ``SystemExit`` propagate.
    """
    target = f'{file_name}.{ext}'
    if path.exists(target):
        print(f'EXISTS: {target}')
        return

    print(f'Downloading {ext.upper()}')

    try:
        # The URL path segment is "content" for PDFs, "download" otherwise.
        ctx = "content" if ext == "pdf" else "download"
        url = f'https://link.springer.com/{ctx}/{ext}/{row["Item DOI"]}.{ext}'

        # Without a timeout a stalled connection would block the run forever.
        response = requests.get(url, timeout=60)
        # Reject 4xx/5xx answers so an error page is never saved as a book.
        response.raise_for_status()

        # Very short bodies are treated as "not the requested file".
        if len(response.content) < 500:
            raise ValueError(f'Not a {ext.upper()}')

        # Context manager guarantees the handle is flushed and closed.
        with open(target, 'wb') as out_file:
            out_file.write(response.content)
    except Exception as err:
        # `Exception` (not a bare except) lets Ctrl-C still abort the script.
        print(f'Failed to download {ext.upper()} for {row["Item Title"]} by {row["Authors"]}: {err}')


if __name__ == '__main__':
    # Entry point: fetch the PDF and EPUB of every book listed in the
    # search-results CSV passed as the first command-line argument.
    if len(sys.argv) < 2:
        sys.exit('Usage: python springer.py SearchResults.csv')

    # Downloads are stored in the same directory as the CSV file.
    output_dir = Path(sys.argv[1]).parent

    # newline='' is what the csv module expects for files it parses itself.
    with open(sys.argv[1], encoding='utf-8', newline='') as csv_file:
        # DictReader consumes the header line on its own, so no explicit
        # next() call is needed; calling it would drop the first book.
        reader = csv.DictReader(csv_file, delimiter=",", quoting=csv.QUOTE_ALL)

        # `row` and `file_name` intentionally stay module-level names:
        # download_file() reads them as globals.
        for row in reader:
            print(f'Processing: "{row["Item Title"]} by {row["Authors"]}"')
            file_name = f'{output_dir}/' + get_valid_filename(f'{row["Item Title"]} - {row["Authors"]}')

            download_file("pdf")
            download_file("epub")
	# 1. Open https://link.springer.com/search/page/1?facet-content-type=%22Book%22&package=mat-covid19_textbooks
	# 2. Click on the button on the top right of the table to save results into CSV file (SearchResults.csv)
	# 3. Run: python springer.py SearchResults.csv
	# Note: Python 3.6+ is required (the script uses f-strings); run `pip install requests` if the module is missing.

	import sys
	import csv
	import requests
	from pathlib import Path
	from os import path
	import re


	def get_valid_filename(s):
		"""Return ``s`` reduced to characters that are kept for file names.

		Leading and trailing whitespace is trimmed first. After that, every
		character that is not a hyphen, a space, a dot, or a Unicode word
		character (letter, digit, underscore) is dropped.
		"""
		return re.sub(r'(?u)[^- \w.]', '', s.strip())


	def download_file(ext):
		"""Download the current book in the given format.

		Reads two module-level globals that the main loop sets before calling:
		``row`` (the current CSV record) and ``file_name`` (the target path
		without extension). If ``<file_name>.<ext>`` already exists, nothing
		is fetched.

		Args:
			ext: Format / file extension to fetch, e.g. ``"pdf"`` or ``"epub"``.

		Returns:
			None. Progress and failures are printed to stdout. Ordinary errors
			are reported and swallowed so the caller can carry on, while
			``KeyboardInterrupt`` and ``SystemExit`` propagate.
		"""
		target = f'{file_name}.{ext}'
		if path.exists(target):
			print(f'EXISTS: {target}')
			return

		print(f'Downloading {ext.upper()}')

		try:
			# The URL path segment is "content" for PDFs, "download" otherwise.
			ctx = "content" if ext == "pdf" else "download"
			url = f'https://link.springer.com/{ctx}/{ext}/{row["Item DOI"]}.{ext}'

			# Without a timeout a stalled connection would block the run forever.
			response = requests.get(url, timeout=60)
			# Reject 4xx/5xx answers so an error page is never saved as a book.
			response.raise_for_status()

			# Very short bodies are treated as "not the requested file".
			if len(response.content) < 500:
				raise ValueError(f'Not a {ext.upper()}')

			# Context manager guarantees the handle is flushed and closed.
			with open(target, 'wb') as out_file:
				out_file.write(response.content)
		except Exception as err:
			# `Exception` (not a bare except) lets Ctrl-C still abort the script.
			print(f'Failed to download {ext.upper()} for {row["Item Title"]} by {row["Authors"]}: {err}')


	if __name__ == '__main__':
		# Entry point: fetch the PDF and EPUB of every book listed in the
		# search-results CSV passed as the first command-line argument.
		if len(sys.argv) < 2:
			sys.exit('Usage: python springer.py SearchResults.csv')

		# Downloads are stored in the same directory as the CSV file.
		output_dir = Path(sys.argv[1]).parent

		# newline='' is what the csv module expects for files it parses itself.
		with open(sys.argv[1], encoding='utf-8', newline='') as csv_file:
			# DictReader consumes the header line on its own, so no explicit
			# next() call is needed; calling it would drop the first book.
			reader = csv.DictReader(csv_file, delimiter=",", quoting=csv.QUOTE_ALL)

			# `row` and `file_name` intentionally stay module-level names:
			# download_file() reads them as globals.
			for row in reader:
				print(f'Processing: "{row["Item Title"]} by {row["Authors"]}"')
				file_name = f'{output_dir}/' + get_valid_filename(f'{row["Item Title"]} - {row["Authors"]}')

				download_file("pdf")
				download_file("epub")