Skip to content

Instantly share code, notes, and snippets.

View mrubash1's full-sized avatar

Matthew Rubashkin mrubash1

View GitHub Profile
# -*- coding: utf-8 -*-
import itertools
import re
import urlparse
import boto
import warc
from boto.s3.key import Key
from gzipstream import GzipStreamFile