- first thing I need to do
- second thing I need to do
- third thing I need to do
| import os | |
| from scrapy.dupefilter import RFPDupeFilter | |
| from scrapy.utils.request import request_fingerprint | |
| class CustomFilter(RFPDupeFilter): | |
| """A dupe filter that considers specific ids in the url""" | |
| def __getid(self, url): | |
| mm = url.split("&refer")[0] #or something like that |
| # !/usr/bin/env python | |
| # -*- coding:utf-8 -*- | |
| import sys | |
| import time | |
| import Queue | |
| import threading | |
| import traceback | |
| class ExitException(Exception): |