# tecknoh19/pdf_dl.py

## pdf_dl.py
# Downloads every PDF file linked from the page at the given URL
# USAGE: pdf_dl.py <URL>
import os
import sys
import urllib2
import urlparse

from bs4 import BeautifulSoup

# Script body (Python 2): fetch the page named on the command line, find every
# anchor whose href mentions ".pdf", and save each linked file into the current
# working directory.
if len(sys.argv) < 2:
    # Exit with the usage line rather than an IndexError traceback.
    sys.exit("USAGE: pdf_dl.py <URL>")

page_url = sys.argv[1]

resp = urllib2.urlopen(page_url)
try:
    # Hand BeautifulSoup the charset from the Content-Type header (None when
    # the header carries no charset) so it does not have to guess.
    soup = BeautifulSoup(resp, from_encoding=resp.info().getparam('charset'))
finally:
    resp.close()

for link in soup.find_all('a', href=True):
    href = link['href']
    # Case-insensitive so links such as "REPORT.PDF" are picked up as well.
    if ".pdf" not in href.lower():
        continue

    # urljoin resolves relative, root-relative and absolute hrefs against the
    # page URL, which plain string concatenation cannot do.
    pdf_url = urlparse.urljoin(page_url, href)

    # Save under the last path component only: an href may contain
    # directories, a full URL, or "../" segments, none of which is a safe or
    # valid local file name.
    filename = os.path.basename(urlparse.urlsplit(pdf_url).path)
    if not filename:
        print("Skipping " + href)
        continue

    print("Downloading " + href)
    dl = urllib2.urlopen(pdf_url)
    try:
        # "wb": PDF data is binary; text mode would corrupt it on platforms
        # that translate line endings.
        with open(filename, "wb") as fh:
            fh.write(dl.read())
    finally:
        dl.close()