Created
September 6, 2013 18:11
-
-
Save vetri02/6467671 to your computer and use it in GitHub Desktop.
From Neckbeard Republic: I learned this in the web-scraping section and adapted the code to the new GitHub Explore pages.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import requests
from bs4 import BeautifulSoup

# Landing page that lists GitHub's currently-trending repositories.
GITHUB_EXPLORE_PAGE = 'https://github.com/explore'
def get_html_explore():
    """Fetch the GitHub Explore page and return the raw response body (bytes).

    Raises requests.HTTPError on a non-2xx response instead of silently
    handing an error page to the parser, and times out rather than hanging
    forever on a stalled connection.
    """
    response = requests.get(GITHUB_EXPLORE_PAGE, timeout=10)
    response.raise_for_status()
    return response.content
def parse_html(content):
    """Parse the Explore page HTML and return the trending-repo <li> elements.

    Returns an empty list when the expected container is missing, so callers
    do not crash with AttributeError on a page-layout change.
    """
    # Name the parser explicitly: bs4 warns when none is given, and the
    # default otherwise depends on what happens to be installed.
    soup = BeautifulSoup(content, 'html.parser')
    trending_repo_div = soup.find('div', {'class': 'repo-collection'})
    if trending_repo_div is None:
        return []
    return trending_repo_div.findAll('li', {'class': 'collection-item'})
def repo_breakdown(repo):
    """Extract owner, project, fork count and star count from one repo <li>.

    The header anchor text looks like "user/project"; the two
    'collection-stat' spans are forks then stars, in page order.
    """
    header = repo.find('a', {'class': 'repo-name'})
    forks, stars = repo.findAll('span', {'class': 'collection-stat'})
    repo_details = header.text.split("/")
    return {
        'user': repo_details[0],
        'project': repo_details[1],
        'forks': forks.text,
        # Bug fix: the original returned the literal string 'stars.text'
        # (quoted) instead of the element's text content.
        'stars': stars.text,
    }
def get_data(repos):
    """Return a list of detail dicts, one per trending-repo element.

    Fixes the 'treding_repos' typo and replaces the manual append loop
    with an equivalent list comprehension.
    """
    return [repo_breakdown(repo) for repo in repos]
def main():
    """Fetch, parse and print the current trending repositories."""
    content = get_html_explore()
    repos = parse_html(content)
    # print(...) with a single argument behaves identically under
    # Python 2 (parenthesized expression) and Python 3 (function call).
    print(get_data(repos))


if __name__ == '__main__':
    main()
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment