# AlJohri/scrape_presidential_debates.py

## scrape_presidential_debates.py
import requests
from bs4 import BeautifulSoup

# Index page listing the presidential candidate debates (1960-2016); each
# data row of its listing table carries a date and a link to a transcript.
url = 'https://www.presidency.ucsb.edu/documents/presidential-documents-archive-guidebook/presidential-candidates-debates-1960-2016'

# A timeout keeps the script from hanging forever on a stalled connection,
# and raise_for_status() stops us from silently parsing an HTTP error page.
response = requests.get(url, timeout=30)
response.raise_for_status()

soup = BeautifulSoup(response.text, 'html.parser')

# The selector walks down three nested tables inside `.field-body` and
# yields the rows of the innermost one.
for tr in soup.select('.field-body > table > tbody > tr > td > table > tbody > tr > td > table > tbody > tr'):
    columns = tr.select('td')

    # Data rows have either two cells (date, link) or three cells
    # (year, date, link). Any other shape is skipped explicitly so a row
    # never falls through and reuses values left over from a previous row.
    if len(columns) not in (2, 3):
        continue

    # Cells that span rows/columns or hold images are layout/header rows.
    if any(x.get('colspan') or x.get('rowspan') or x.select('img') for x in columns):
        continue

    # In both accepted shapes the last two cells are the date and the link;
    # the leading year cell (when present) is not needed.
    date_cell, link_cell = columns[-2:]

    # Some cells may contain no anchor at all; skip those rows instead of
    # crashing on `None.get(...)`.
    anchor = link_cell.find('a')
    if anchor is None:
        continue

    print(date_cell.text, anchor.get('href'))