# gnufs/webscraper.py

## webscraper.py
import sys, requests
from bs4 import BeautifulSoup

def scrape(url='http://example.com', timeout=10):
	"""Download *url* and print every text node found inside its <body>.

	Args:
		url: Address of the page to fetch.
		timeout: Seconds to wait for the server, passed straight to
			``requests.get``. ``None`` waits indefinitely.

	Raises:
		SystemExit: With status 1 when the page cannot be downloaded.
	"""
	try:
		html = requests.get(url, timeout=timeout).content
	except requests.exceptions.RequestException:
		# Base class of the errors requests raises for malformed URLs,
		# connection failures and timeouts. Catching only this (rather than
		# a bare ``except``) lets Ctrl-C and real bugs propagate.
		print("URL doesn't load")
		# Non-zero status so shell callers can tell the fetch failed.
		sys.exit(1)

	# Name the parser explicitly: without it bs4 picks whichever parser
	# happens to be installed, so output can differ between machines.
	page = BeautifulSoup(html, 'html.parser')

	body = page.body
	if body is None:
		# html.parser does not invent a <body> for documents lacking one.
		print("Page could not be read.")
		return

	try:
		for s in body.find_all(text=True):
			print(s)
	except UnicodeError:
		# stdout's encoding cannot represent a character from the page.
		print("Page could not be read.")

# Python 2 calls the line-reading prompt raw_input(); Python 3 renamed it to
# input(). Use whichever one exists so the script runs on either.
try:
	_read_line = raw_input
except NameError:
	_read_line = input

# Take the URL from the single command-line argument, otherwise ask for it.
if len(sys.argv) != 2:
	url = _read_line("Please enter a URL: ")
else:
	url = sys.argv[1]

# Surrounding whitespace (easy to type at the prompt) would defeat the
# prefix check below.
url = url.strip()

if url.lower().startswith('http'):
	scrape(url)
else:
	# Report the rejection instead of exiting silently with nothing printed.
	print("URL must start with http")
	sys.exit(1)