# isaqueprofeta/download.py

## download.py
import scrapy
from scrapy.http import Request


class SheetDownloader(scrapy.Spider):
    """Spider that follows links on paginated listing pages and saves each target.

    The listing pages are ``https://mydomain.com/path/list/1`` through
    ``https://mydomain.com/path/list/99``. Every element matching the
    ``tag.class`` selector on a listing page is treated as a link to a file
    that should be downloaded and written to disk.
    """

    name = 'my_downloader'
    allowed_domains = ['mydomain.com']
    # Site root that hrefs found on the listing pages are resolved against.
    base_url = 'https://mydomain.com/'
    # range(1, 100) stops before 100, so pages 1..99 are requested.
    start_urls = [f'https://mydomain.com/path/list/{page}' for page in range(1, 100)]

    def parse(self, response):
        """Yield a download request for every matching link on a listing page.

        Args:
            response: The fetched listing page.

        Yields:
            One ``Request`` per matched element that has a non-empty ``href``,
            with ``save_pdf`` as its callback.
        """
        from urllib.parse import urljoin

        for link in response.css('tag.class'):
            href = (link.attrib.get('href') or '').strip()
            if not href:
                # Matched element carries no link target; nothing to fetch.
                continue
            # urljoin resolves plain relative paths against the site root
            # (same result as simple concatenation), but also avoids a doubled
            # slash for hrefs starting with "/" and leaves absolute URLs intact.
            yield Request(
                url=urljoin(self.base_url, href),
                callback=self.save_pdf,
            )

    def save_pdf(self, response):
        """Write the response body to a file in the current working directory.

        The file name is the last segment of the URL's path, so a query
        string never ends up in the name. Responses whose URL has no final
        path segment are skipped with a warning instead of failing on an
        empty file name.

        Args:
            response: The downloaded response whose body is saved.
        """
        import posixpath
        from urllib.parse import urlsplit

        path = posixpath.basename(urlsplit(response.url).path)
        if not path:
            self.logger.warning('Skipping %s: no file name in URL', response.url)
            return
        self.logger.info('Saving PDF %s', path)
        with open(path, 'wb') as file:
            file.write(response.body)
	import scrapy
	from scrapy.http import Request


	class SheetDownloader(scrapy.Spider):
	    """Spider that follows links on paginated listing pages and saves each target.

	    The listing pages are ``https://mydomain.com/path/list/1`` through
	    ``https://mydomain.com/path/list/99``. Every element matching the
	    ``tag.class`` selector on a listing page is treated as a link to a file
	    that should be downloaded and written to disk.
	    """

	    name = 'my_downloader'
	    allowed_domains = ['mydomain.com']
	    # Site root that hrefs found on the listing pages are resolved against.
	    base_url = 'https://mydomain.com/'
	    # range(1, 100) stops before 100, so pages 1..99 are requested.
	    start_urls = [f'https://mydomain.com/path/list/{page}' for page in range(1, 100)]

	    def parse(self, response):
	        """Yield a download request for every matching link on a listing page.

	        Args:
	            response: The fetched listing page.

	        Yields:
	            One ``Request`` per matched element that has a non-empty ``href``,
	            with ``save_pdf`` as its callback.
	        """
	        from urllib.parse import urljoin

	        for link in response.css('tag.class'):
	            href = (link.attrib.get('href') or '').strip()
	            if not href:
	                # Matched element carries no link target; nothing to fetch.
	                continue
	            # urljoin resolves plain relative paths against the site root
	            # (same result as simple concatenation), but also avoids a doubled
	            # slash for hrefs starting with "/" and leaves absolute URLs intact.
	            yield Request(
	                url=urljoin(self.base_url, href),
	                callback=self.save_pdf,
	            )

	    def save_pdf(self, response):
	        """Write the response body to a file in the current working directory.

	        The file name is the last segment of the URL's path, so a query
	        string never ends up in the name. Responses whose URL has no final
	        path segment are skipped with a warning instead of failing on an
	        empty file name.

	        Args:
	            response: The downloaded response whose body is saved.
	        """
	        import posixpath
	        from urllib.parse import urlsplit

	        path = posixpath.basename(urlsplit(response.url).path)
	        if not path:
	            self.logger.warning('Skipping %s: no file name in URL', response.url)
	            return
	        self.logger.info('Saving PDF %s', path)
	        with open(path, 'wb') as file:
	            file.write(response.body)