Skip to content

Instantly share code, notes, and snippets.

@Pradip-p
Created February 22, 2022 07:33
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
Save Pradip-p/c0fe28d933fa0c0860116019b42120c6 to your computer and use it in GitHub Desktop.
One page Scrapy Python
import scrapy
from scrapy.crawler import CrawlerProcess
from scrapy.utils.project import get_project_settings
class LazyCrawler(scrapy.Spider):
    """Scrape quotes (author, text, tag) from quotes.toscrape.com.

    Optionally restrict the crawl to a single tag by passing a spider
    argument on the command line: ``scrapy crawl quotes -a tag=<name>``,
    which starts at http://quotes.toscrape.com/tag/<name>.
    """

    name = "quotes"

    def start_requests(self):
        """Yield the initial request, optionally scoped to one tag."""
        url = 'http://quotes.toscrape.com/'
        # `tag` is an optional spider argument (-a tag=...); absent by default.
        tag = getattr(self, 'tag', None)
        if tag is not None:
            url = url + 'tag/' + tag
        yield scrapy.Request(url, self.parse)

    def parse(self, response):
        """Extract every quote on the page, then follow pagination.

        Yields one dict per quote with 'author', 'text' and 'tag' keys,
        plus a follow-up request for the next page while one exists.
        """
        for quote in response.css('div.quote'):
            yield {
                'author': quote.css('small.author::text').get(),
                'text': quote.css('span.text::text').get(),
                # NOTE(review): .get() returns only the FIRST tag even when a
                # quote carries several; switch to .getall() to capture all.
                'tag': quote.css('.tags a.tag::text').get(),
            }
        # Keep following the "Next" link until pagination runs out.
        next_page = response.css('li.next a::attr(href)').get()
        if next_page is not None:
            yield response.follow(next_page, self.parse)
if __name__ == "__main__":
    # Run the spider in-process without the `scrapy crawl` CLI.
    # get_project_settings() picks up project settings when run inside a
    # Scrapy project directory; otherwise Scrapy defaults apply.
    process = CrawlerProcess(get_project_settings())
    process.crawl(LazyCrawler)
    process.start()  # the script will block here until the crawling is finished
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment