# palewire/albums.py

## albums.py
from mechanize import Browser
from BeautifulSoup import BeautifulSoup

def extract(html):
    """Return the cell text of the bordered table found in ``html``.

    The markup is parsed with BeautifulSoup, the first ``<table>`` whose
    ``border`` attribute is 1 is located, its first row is skipped, and the
    text of every ``<td>`` in the remaining rows is collected with any
    literal ``&nbsp;`` removed.

    Args:
        html: Markup handed to ``BeautifulSoup``.

    Returns:
        A list with one entry per table row after the first; each entry is
        a list of that row's cell strings. An empty list is returned when
        no matching table exists.
    """
    soup = BeautifulSoup(html)
    table = soup.find("table", border=1)
    if table is None:
        # find() gives back None when nothing matches; without this guard
        # the findAll() call below dies with an opaque AttributeError.
        return []
    return [
        [cell.text.replace("&nbsp;", "") for cell in row.findAll('td')]
        # [1:] drops the first row (presumably the header row).
        for row in table.findAll('tr')[1:]
    ]

# Page the scrape starts from.
url = 'http://palewi.re/scrape/albums/2006.html'
# A single mechanize Browser is reused so that follow_link() below operates
# on the page opened here.
mech = Browser()

# Fetch the starting page and pull the table rows out of its markup.
page = mech.open(url)
html = page.read()
rows = extract(html)

# Follow the link on the current page whose text matches the regex
# "Previous" (presumably the prior year's listing -- confirm against the
# site), then extract that page's rows the same way.
page2 = mech.follow_link(text_regex="Previous")
html2 = page2.read()
rows2 = extract(html2)
	from mechanize import Browser
	from BeautifulSoup import BeautifulSoup

	def extract(html):
		"""Return the cell text of the bordered table found in ``html``.

		The markup is parsed with BeautifulSoup, the first ``<table>`` whose
		``border`` attribute is 1 is located, its first row is skipped, and
		the text of every ``<td>`` in the remaining rows is collected with
		any literal ``&nbsp;`` removed.

		Args:
			html: Markup handed to ``BeautifulSoup``.

		Returns:
			A list with one entry per table row after the first; each entry
			is a list of that row's cell strings. An empty list is returned
			when no matching table exists.
		"""
		soup = BeautifulSoup(html)
		table = soup.find("table", border=1)
		if table is None:
			# find() gives back None when nothing matches; bail out instead
			# of failing on None.findAll below.
			return []
		list_of_rows = []
		# [1:] drops the first row (presumably the header row).
		for row in table.findAll('tr')[1:]:
			list_of_cells = []
			for cell in row.findAll('td'):
				# Strip the literal &nbsp; entity only; removing ordinary
				# spaces would run the words of a cell together.
				text = cell.text.replace("&nbsp;", "")
				list_of_cells.append(text)
			list_of_rows.append(list_of_cells)
		return list_of_rows

	# NOTE(review): these statements repeat the top-level script that appears
	# earlier in this file, and the leading tab is an unexpected indent at
	# module level -- confirm whether this copy is meant to be kept.
	# Page the scrape starts from.
	url = 'http://palewi.re/scrape/albums/2006.html'
	# A single mechanize Browser is reused so that follow_link() below
	# operates on the page opened here.
	mech = Browser()

	# Fetch the starting page and pull the table rows out of its markup.
	page = mech.open(url)
	html = page.read()
	rows = extract(html)

	# Follow the link on the current page whose text matches the regex
	# "Previous" (presumably the prior year's listing -- confirm against the
	# site), then extract that page's rows the same way.
	page2 = mech.follow_link(text_regex="Previous")
	html2 = page2.read()
	rows2 = extract(html2)