kozmonaut/scrape.py

## scrape.py
from bs4 import BeautifulSoup
import csv
import re
import requests

# Ask the user which page to crawl.
print ("Copy the link you wanna scrap:")
# raw_input only exists on Python 2; fall back to input on Python 3 so the
# script runs on both (Python 2's own input() would eval the typed text).
try:
	read_line = raw_input
except NameError:
	read_line = input
url = read_line("->")
# Fetch the page; the timeout keeps a stalled server from hanging the script.
request = requests.get(url, timeout=30)
# Response body decoded to text
plain = request.text
# Make the soup. The parser is named explicitly so the result does not depend
# on which optional parsers happen to be installed (and no warning is emitted).
soup = BeautifulSoup(plain, "html.parser")

# Type the term you wanna use for search
term = "someterm"
# Find every tag whose href attribute matches the term (used as a regex)
links = soup.find_all(href=re.compile(term))

# Write one matching href per line; the with-block closes the file even if a
# write fails part-way through.
with open("result.html", "w") as f:
	for link in links:
		f.write(link.get('href') + '\n')
	from bs4 import BeautifulSoup
	import csv
	import re
	import requests

	# Ask the user which page to crawl.
	print ("Copy the link you wanna scrap:")
	# raw_input only exists on Python 2; fall back to input on Python 3 so the
	# script runs on both (Python 2's own input() would eval the typed text).
	try:
		read_line = raw_input
	except NameError:
		read_line = input
	url = read_line("->")
	# Fetch the page; the timeout keeps a stalled server from hanging the script.
	request = requests.get(url, timeout=30)
	# Response body decoded to text
	plain = request.text
	# Make the soup. The parser is named explicitly so the result does not depend
	# on which optional parsers happen to be installed (and no warning is emitted).
	soup = BeautifulSoup(plain, "html.parser")

	# Type the term you wanna use for search
	term = "someterm"
	# Find every tag whose href attribute matches the term (used as a regex)
	links = soup.find_all(href=re.compile(term))

	# Write one matching href per line; the with-block closes the file even if a
	# write fails part-way through.
	with open("result.html", "w") as f:
		for link in links:
			f.write(link.get('href') + '\n')