# CHARITH1995/web-scrapping.py

## web-scrapping.py
from bs4 import BeautifulSoup
import time
from selenium import webdriver
import MySQLdb
from datetime import datetime
import csv

# Page to scrape.
url = "http://sinhala.adaderana.lk/sinhala-hot-news.php"

# Open the MySQL connection used by this script. The connection is set to
# utf8 with use_unicode=True (presumably so the scraped Sinhala text is
# exchanged as unicode strings -- confirm against the table definitions).
# NOTE(review): the credentials are hard-coded (root, empty password);
# consider loading them from configuration instead.
db = MySQLdb.connect(
    host="localhost",
    user="root",
    passwd="",
    db="research",
    charset='utf8',
    use_unicode=True,
)

# Cursor for issuing SQL statements on the connection above.
cur = db.cursor()

# The target page builds its content with JavaScript, so it is loaded in a
# real browser through Selenium rather than fetched as raw HTML.
# NOTE(review): the `executable_path` argument is not accepted by recent
# Selenium 4 releases -- confirm the installed Selenium version.
driver = webdriver.Firefox(executable_path=r'D:\apps\anaconda\geckodriver.exe')
driver.get(url)

# Fixed pause before taking the HTML snapshot, to give the page's scripts
# time to run.
time.sleep(5)
htmlSource = driver.page_source

# Parse the rendered HTML and collect every news entry. The tag and class
# used here are specific to this site's markup.
soup = BeautifulSoup(htmlSource, 'lxml')
all_div = soup.find_all("div", {"class": "news-story"})

# NOTE(review): nothing in this section closes `driver` or `db`; confirm that
# the rest of the script calls driver.quit() and db.close() when finished.