# tbbooher/read_edmunds.py

## read_edmunds.py
from bs4 import BeautifulSoup
import csv
import re

# Read edmunds.html from the working directory and parse it with the
# standard-library-backed 'html.parser'. The encoding is pinned so decoding
# does not depend on the platform's locale default.
# NOTE(review): assumes the page was saved as UTF-8 -- confirm.
with open('edmunds.html', 'r', encoding='utf-8') as f:
    html = f.read()

soup = BeautifulSoup(html, 'html.parser')

def _node_text(node, default="N/A"):
    """Return the stripped text of a parsed tag, or *default* when it is None."""
    if node is None:
        return default
    return node.text.strip()


# One [title, desc, price, mileage] row per "vehicle-info" card.
results = []

for vehicle in soup.find_all("div", class_="vehicle-info"):
    # find() returns None when a card lacks the element. Fall back to "N/A"
    # (the placeholder already used for a missing mileage) instead of
    # aborting the whole run with an AttributeError.
    # Title and description have runs of whitespace collapsed to one space.
    title = re.sub(r'\s+', ' ',
                   _node_text(vehicle.find("div", class_="text-blue-50")))
    desc = re.sub(r'\s+', ' ',
                  _node_text(vehicle.find("div", class_="text-gray-dark")))
    price = _node_text(vehicle.find("span", class_="heading-3"))

    # The mileage is read from the <span> that follows the one titled
    # "Car Mileage"; either of the two spans may be missing.
    span = vehicle.find("span", title="Car Mileage")
    if span is not None:
        mileage = _node_text(span.find_next_sibling("span"))
    else:
        mileage = "N/A"

    print("Title:", title)
    print("Desc:", desc)
    print("Price:", price)
    print("Miles:", mileage)

    result = [title, desc, price, mileage]
    results.append(result)


# Echo every collected row to stdout.
for result in results:
    print(result)

# Write the rows to output_edmunds.csv. newline='' leaves line endings to the
# csv module, and the encoding is pinned so the file is written the same way
# regardless of the platform's locale default.
with open('output_edmunds.csv', 'w', newline='', encoding='utf-8') as f:
    writer = csv.writer(f)
    # Header names follow the row layout; the fourth field is the mileage.
    writer.writerow(['Title', 'Desc', 'Price', 'Mileage'])
    writer.writerows(results)
	from bs4 import BeautifulSoup
	import csv
	import re

	# NOTE(review): this section repeats the scrape-and-export steps that
	# appear earlier in this file, with one leading tab on every line.
	# Presumably a paste artifact -- confirm whether this second copy
	# should be removed. Nested blocks are indented with further tabs.

	# Read edmunds.html and parse it. The encoding is pinned so decoding does
	# not depend on the platform's locale default.
	# NOTE(review): assumes the page was saved as UTF-8 -- confirm.
	with open('edmunds.html', 'r', encoding='utf-8') as f:
		html = f.read()

	soup = BeautifulSoup(html, 'html.parser')


	def _node_text(node, default="N/A"):
		"""Return the stripped text of a parsed tag, or *default* when it is None."""
		if node is None:
			return default
		return node.text.strip()


	# One [title, desc, price, mileage] row per "vehicle-info" card.
	results = []

	for vehicle in soup.find_all("div", class_="vehicle-info"):
		# find() returns None when a card lacks the element. Fall back to
		# "N/A" instead of aborting the run with an AttributeError.
		# Title and description have whitespace runs collapsed to one space.
		title = re.sub(r'\s+', ' ',
			_node_text(vehicle.find("div", class_="text-blue-50")))
		desc = re.sub(r'\s+', ' ',
			_node_text(vehicle.find("div", class_="text-gray-dark")))
		price = _node_text(vehicle.find("span", class_="heading-3"))

		# The mileage is read from the <span> that follows the one titled
		# "Car Mileage"; either of the two spans may be missing.
		span = vehicle.find("span", title="Car Mileage")
		if span is not None:
			mileage = _node_text(span.find_next_sibling("span"))
		else:
			mileage = "N/A"

		print("Title:", title)
		print("Desc:", desc)
		print("Price:", price)
		print("Miles:", mileage)

		result = [title, desc, price, mileage]
		results.append(result)


	# Echo every collected row to stdout.
	for result in results:
		print(result)

	# Write the rows to output_edmunds.csv. newline='' leaves line endings to
	# the csv module; the encoding is pinned for platform-independent output.
	with open('output_edmunds.csv', 'w', newline='', encoding='utf-8') as f:
		writer = csv.writer(f)
		# Header names follow the row layout; the fourth field is the mileage.
		writer.writerow(['Title', 'Desc', 'Price', 'Mileage'])
		writer.writerows(results)