# samrat/HN_grab.py

## HN_grab.py
import urllib2
from BeautifulSoup import BeautifulSoup

# Address that get_page() opens; the rest of the script scrapes whatever this returns.
HN_url = "http://news.ycombinator.com"

def get_page():
	"""Open HN_url and hand back the response.

	Returns:
		The object returned by urllib2.urlopen(HN_url). The response is
		returned as-is: this function neither reads nor closes it.
	"""
	return urllib2.urlopen(HN_url)

def get_stories(content):
	"""Gather every <a> tag nested inside a <td class="title"> cell.

	Args:
		content: markup to parse; passed straight to the BeautifulSoup
			constructor.

	Returns:
		A flat list of the anchor tags, in the order the cells (and the
		anchors within each cell) are found. Empty when nothing matches.
	"""
	parsed = BeautifulSoup(content)
	title_cells = parsed.findAll("td", { "class":"title" })

	anchors = []
	for cell in title_cells:
		# A cell may hold zero or several anchors; keep them all.
		anchors.extend(cell.findAll("a"))

	return anchors


# Script body: fetch the page once and print one "* <title> <url>" line for
# each anchor returned by get_stories().
#
# A second, indentation-mangled copy of the imports, constant, functions and
# this loop used to sit inside the loop body; it made the file unparseable
# and has been removed.
#
# NOTE(review): `.string` is presumably None for an anchor whose content is
# not a single text node, in which case `.strip()` would raise -- confirm
# against the BeautifulSoup version in use before relying on this for other
# pages.
for title_a in get_stories(get_page()):
	title = title_a.string.strip()
	url = title_a['href']
	# One parenthesised argument prints the same "* title url" text under the
	# Python 2 print statement while also being valid function-call syntax.
	print("* %s %s" % (title, url))