# jakebox/pdf_parser.py

## pdf_parser.py
###
### PDF Parser/Downloader
### By Jake B - December 2019
###

import os
import requests
import PyPDF2
import re

# Download the menu and save it locally as a PDF.
url = 'URL OF PDF GOES HERE'
filename = "lunch.pdf"
# A timeout keeps the script from hanging forever on an unresponsive server.
r = requests.get(url, allow_redirects=True, timeout=30)
# Stop here on an HTTP error (4xx/5xx) instead of saving an error page as
# "lunch.pdf" and hitting a confusing parse failure further down.
r.raise_for_status()
# The context manager flushes and closes the file before it is read back.
with open(filename, 'wb') as pdf_file:
    pdf_file.write(r.content)

# Load the saved file and extract the text of its first page into a string.
# NOTE(review): PdfFileReader/getPage/extractText are the legacy PyPDF2 names;
# newer PyPDF2 releases use PdfReader/pages[0]/extract_text() -- confirm
# against the installed version before changing them.
with open(filename, 'rb') as lunchList:
    # Keep the file open while the reader is in use; any further work with
    # read_pdf should happen inside this block, before the file is closed.
    read_pdf = PyPDF2.PdfFileReader(lunchList)
    page = read_pdf.getPage(0)
    page_content = page.extractText()

# Print the text extracted from the first page.
print(page_content)
	###
	### PDF Parser/Downloader
	### By Jake B - December 2019
	###

	import os
	import requests
	import PyPDF2
	import re

	# Download the menu and save it locally as a PDF.
	url = 'URL OF PDF GOES HERE'
	filename = "lunch.pdf"
	# A timeout keeps the script from hanging forever on an unresponsive server.
	r = requests.get(url, allow_redirects=True, timeout=30)
	# Stop here on an HTTP error (4xx/5xx) instead of saving an error page as
	# "lunch.pdf" and hitting a confusing parse failure further down.
	r.raise_for_status()
	# The context manager flushes and closes the file before it is read back.
	with open(filename, 'wb') as pdf_file:
		pdf_file.write(r.content)

	# Load the saved file and extract the text of its first page into a string.
	# NOTE(review): PdfFileReader/getPage/extractText are the legacy PyPDF2 names;
	# newer PyPDF2 releases use PdfReader/pages[0]/extract_text() -- confirm
	# against the installed version before changing them.
	with open(filename, 'rb') as lunchList:
		# Keep the file open while the reader is in use; any further work with
		# read_pdf should happen inside this block, before the file is closed.
		read_pdf = PyPDF2.PdfFileReader(lunchList)
		page = read_pdf.getPage(0)
		page_content = page.extractText()

	# Print the text extracted from the first page.
	print(page_content)