Skip to content

Instantly share code, notes, and snippets.

@kmike
kmike / idealspider.py
Last active August 29, 2015 14:05 — forked from dangra/idealspider.py
import scrapy
from scrapy.http import safeurl
# Spider subclass of scrapy.Spider named 'loremipsum', with
# https://www.lipsum.com as its only start URL.
# NOTE(review): indentation was lost in this copy, so the class body below is
# not valid Python as written -- restore the indentation before use.
class Spider(scrapy.Spider):
# Value assigned to the spider's `name` attribute.
name = 'loremipsum'
# One-element tuple of URLs assigned to `start_urls`.
start_urls = ('https://www.lipsum.com',)
# NOTE(review): no body for parse() is visible in this copy; the text that
# follows appears to be the start of a separate script (it opens with its own
# shebang and coding line). Recover the method body from the original gist.
def parse(self, response):
#!/usr/bin/env python2
# coding: utf-8
import nltk
def get_available_corpora():
for element in dir(nltk.corpus):
if element[0] == '_':
continue
elements_type = str(type(getattr(nltk.corpus, element)))