tinnet/urlchecker.py

## urlchecker.py
from __future__ import print_function

import argparse
import csv
import requests
import sys

# Epilog text handed to argparse; it is shown at the end of the --help output.
# It names every column the script accepts as the URL field.
_EPILOG = """
Script takes a list of .csv files, tries to guess their format (separator),
then checks for a field called 'URL' (or 'url' / 'uri'), tries to fetch that
url and prints the response code back out (with the history of codes attached
if there were redirects)."""

def find_url(row):
    """Return the URL stored in *row*, or None when no URL column exists.

    The column names 'URL', 'url' and 'uri' are tried in that order and the
    value of the first one present in *row* is returned.
    """
    for column in ('URL', 'url', 'uri'):
        if column in row:
            return row[column]
    return None

if __name__ == '__main__':
    # Command-line entry point: for every CSV file named on the command line,
    # fetch the URL found in each row and print one semicolon-separated result
    # line (URL, final status code, status codes of any redirects) to stdout.
    parser = argparse.ArgumentParser(
        description='Checks urls from .csv files for their HTTP response codes',
        epilog=_EPILOG)
    parser.add_argument('files', type=str, metavar='CSVFILE', nargs='+')
    args = parser.parse_args()

    # Upper bound (seconds) for a single request. requests never times out
    # unless told to, so one unresponsive host would stall the whole run.
    request_timeout = 30

    for path in args.files:
        # Plain 'r' replaces the former 'rU': universal newlines are the
        # default for text mode on Python 3, and the 'U' flag is rejected
        # by Python 3.11 and later.
        with open(path, 'r') as csvfile:
            try:
                dialect = csv.Sniffer().sniff(csvfile.read(1024))
            except csv.Error:
                # The sniffer gives up when the sample shows no delimiter
                # (e.g. a single-column file); use the default dialect then.
                dialect = csv.excel
            csvfile.seek(0)
            # The header line is emitted once per input file.
            print('"URL";"STATUSCODE";"HISTORY"')
            for row in csv.DictReader(csvfile, dialect=dialect):
                url = find_url(row)
                if not url:
                    # No recognised URL column or an empty cell: there is
                    # nothing to fetch, so report it and move on.
                    print('skipping row without URL: {!r}'.format(row),
                          file=sys.stderr)
                    continue
                try:
                    r = requests.get(url, timeout=request_timeout)
                except requests.exceptions.RequestException as exc:
                    # A failing URL is a result, not a reason to abort: emit
                    # a row with ERROR in the status column and the exception
                    # class name in the history column.
                    print('"{}";ERROR;"{}"'.format(url, type(exc).__name__))
                    continue
                print('"{}";{};"{}"'.format(
                    url, r.status_code, [h.status_code for h in r.history]))
	from __future__ import print_function

	import argparse
	import csv
	import requests
	import sys

	# Epilog text handed to argparse; it is shown at the end of the --help output.
	# It names every column the script accepts as the URL field.
	_EPILOG = """
	Script takes a list of .csv files, tries to guess their format (separator),
	then checks for a field called 'URL' (or 'url' / 'uri'), tries to fetch that
	url and prints the response code back out (with the history of codes attached
	if there were redirects)."""

	def find_url(row):
	    """Return the URL stored in *row*, or None when no URL column exists.

	    The column names 'URL', 'url' and 'uri' are tried in that order and the
	    value of the first one present in *row* is returned.
	    """
	    for column in ('URL', 'url', 'uri'):
	        if column in row:
	            return row[column]
	    return None

	if __name__ == '__main__':
	    # Command-line entry point: for every CSV file named on the command line,
	    # fetch the URL found in each row and print one semicolon-separated result
	    # line (URL, final status code, status codes of any redirects) to stdout.
	    parser = argparse.ArgumentParser(
	        description='Checks urls from .csv files for their HTTP response codes',
	        epilog=_EPILOG)
	    parser.add_argument('files', type=str, metavar='CSVFILE', nargs='+')
	    args = parser.parse_args()

	    # Upper bound (seconds) for a single request. requests never times out
	    # unless told to, so one unresponsive host would stall the whole run.
	    request_timeout = 30

	    for path in args.files:
	        # Plain 'r' replaces the former 'rU': universal newlines are the
	        # default for text mode on Python 3, and the 'U' flag is rejected
	        # by Python 3.11 and later.
	        with open(path, 'r') as csvfile:
	            try:
	                dialect = csv.Sniffer().sniff(csvfile.read(1024))
	            except csv.Error:
	                # The sniffer gives up when the sample shows no delimiter
	                # (e.g. a single-column file); use the default dialect then.
	                dialect = csv.excel
	            csvfile.seek(0)
	            # The header line is emitted once per input file.
	            print('"URL";"STATUSCODE";"HISTORY"')
	            for row in csv.DictReader(csvfile, dialect=dialect):
	                url = find_url(row)
	                if not url:
	                    # No recognised URL column or an empty cell: there is
	                    # nothing to fetch, so report it and move on.
	                    print('skipping row without URL: {!r}'.format(row),
	                          file=sys.stderr)
	                    continue
	                try:
	                    r = requests.get(url, timeout=request_timeout)
	                except requests.exceptions.RequestException as exc:
	                    # A failing URL is a result, not a reason to abort: emit
	                    # a row with ERROR in the status column and the exception
	                    # class name in the history column.
	                    print('"{}";ERROR;"{}"'.format(url, type(exc).__name__))
	                    continue
	                print('"{}";{};"{}"'.format(
	                    url, r.status_code, [h.status_code for h in r.history]))