# rajacsp/title_collector.py

## title_collector.py
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support.select import Select
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC

def startpy(
    url='https://technet.microsoft.com/en-us/library/aa995718(v=exchg.65).aspx',
    phantomjs_path=r'C:\Phantom\phantomjs-2.1.1-windows\bin\phantomjs.exe',
):
    """Print the text of every ``<h1>`` element found on a web page.

    The page is loaded in a headless PhantomJS browser driven by Selenium,
    and the resulting page source is parsed with BeautifulSoup using the
    ``html5lib`` parser.

    Args:
        url: Address of the page to load. Defaults to the TechNet article
            this script was originally written for.
        phantomjs_path: Filesystem path to the PhantomJS executable.

    Returns:
        None. Each heading's text is written to standard output, one
        heading per ``print`` call.
    """
    # NOTE(review): newer Selenium releases appear to have dropped the
    # PhantomJS driver -- confirm the Selenium version this script targets.
    driver = webdriver.PhantomJS(phantomjs_path)
    try:
        driver.get(url)
        page_html = driver.page_source
    finally:
        # Always shut the browser down, even if loading the page fails;
        # otherwise every run leaves a PhantomJS process behind.
        driver.quit()

    soup = BeautifulSoup(page_html, "html5lib")
    for heading in soup.find_all('h1'):
        print(heading.get_text())

if __name__ == '__main__':
    # Run the collector only when this file is executed as a script,
    # not when it is imported as a module.
    startpy()