amferraz/main.py

## main.py
from twisted.internet import reactor
from scrapy.crawler import Crawler
from scrapy.settings import Settings
from scrapy import signals
from testspiders.spiders.followall import FollowAllSpider


class MyPipeline(object):
    """Item pipeline that prints the URL of every item it receives."""

    def process_item(self, item, spider):
        """Print ``item['url']`` and hand the item on.

        Args:
            item: Scraped item; must support ``item['url']``.
            spider: Spider that produced the item (unused here).

        Returns:
            The same ``item`` object, so that any pipeline component
            running after this one receives it instead of ``None``.
        """
        # Parenthesised single-argument form prints the same text on
        # Python 2 and Python 3.
        print(item['url'])
        return item


# Guarded so that importing this module does not start a crawl: the
# 'main.MyPipeline' entry below refers to this file by module name, so it
# gets imported while the pipeline class is being resolved.
if __name__ == '__main__':
    spider = FollowAllSpider(domain='scrapinghub.com')

    # How ITEM_PIPELINES entries are activated:
    # https://scrapy.readthedocs.org/en/latest/topics/item-pipeline.html?#activating-an-item-pipeline-component
    settings = Settings(
        {
            'ITEM_PIPELINES': {
                'main.MyPipeline': 1,
            },
        }
    )

    crawler = Crawler(settings)
    # Stop the reactor when the spider closes so reactor.run() returns.
    crawler.signals.connect(reactor.stop, signal=signals.spider_closed)
    crawler.configure()
    crawler.crawl(spider)
    crawler.start()
    reactor.run()
	from twisted.internet import reactor
	from scrapy.crawler import Crawler
	from scrapy.settings import Settings
	from scrapy import signals
	from testspiders.spiders.followall import FollowAllSpider


	class MyPipeline(object):
	    """Item pipeline that prints the URL of every item it receives."""

	    def process_item(self, item, spider):
	        """Print ``item['url']`` and hand the item on.

	        Args:
	            item: Scraped item; must support ``item['url']``.
	            spider: Spider that produced the item (unused here).

	        Returns:
	            The same ``item`` object, so that any pipeline component
	            running after this one receives it instead of ``None``.
	        """
	        # Parenthesised single-argument form prints the same text on
	        # Python 2 and Python 3.
	        print(item['url'])
	        return item


	# Guarded so that importing this module does not start a crawl: the
	# 'main.MyPipeline' entry below refers to this file by module name, so
	# it gets imported while the pipeline class is being resolved.
	if __name__ == '__main__':
	    spider = FollowAllSpider(domain='scrapinghub.com')

	    # How ITEM_PIPELINES entries are activated:
	    # https://scrapy.readthedocs.org/en/latest/topics/item-pipeline.html?#activating-an-item-pipeline-component
	    settings = Settings(
	        {
	            'ITEM_PIPELINES': {
	                'main.MyPipeline': 1,
	            },
	        }
	    )

	    crawler = Crawler(settings)
	    # Stop the reactor when the spider closes so reactor.run() returns.
	    crawler.signals.connect(reactor.stop, signal=signals.spider_closed)
	    crawler.configure()
	    crawler.crawl(spider)
	    crawler.start()
	    reactor.run()