# misterhay/marking.py

## marking.py
import os
import pdfplumber
from spellchecker import SpellChecker
spell = SpellChecker()

def student_name(path):
    """Return the student name encoded in a submission directory path.

    Submission directories are expected to be named
    ``<something> - <student name>``; the text following the first ``'- '``
    separator is returned with surrounding whitespace stripped.  When the
    path contains no ``'- '`` separator, the last path component is returned
    instead of raising ``IndexError``.
    """
    parts = path.split('- ')
    if len(parts) > 1:
        return parts[1].strip()
    return os.path.basename(os.path.normpath(path))


def extract_pdf_text(filepath):
    """Return the concatenated text of every page of the PDF at *filepath*."""
    with pdfplumber.open(filepath) as pdf:
        # extract_text() can return None for a page without a text layer
        # (seen in older pdfplumber releases), so fall back to ''.
        return ''.join(
            page.extract_text(x_tolerance=3, y_tolerance=3) or ''
            for page in pdf.pages
        )


def misspelled_words(text):
    """Return the set of words in *text* unknown to the spell checker.

    ``spell.unknown`` expects an iterable of words; handing it the raw string
    would make it iterate character by character, so the text is tokenised
    first.
    """
    return spell.unknown(spell.split_words(text))


def main(root='.'):
    """Walk *root* and report on every PDF and plain-text submission found.

    For PDFs the student name, filename and extracted text are printed; for
    both PDFs and ``.txt`` files the set of misspelled words is printed.
    Files of any other type (including ``.docx``, which is not supported yet)
    are skipped.
    """
    for path, _directories, files in os.walk(root):
        for filename in files:
            # Build the path for every file, not only for PDFs.
            filepath = os.path.join(path, filename)
            if filename.endswith('.pdf'):
                text = extract_pdf_text(filepath)
                print(student_name(path), '-', filename)
                print(text)
            elif filename.endswith('.txt'):
                with open(filepath, 'r') as textfile:
                    text = textfile.read()
            else:
                # .docx and everything else: nothing to analyse yet, and we
                # must not reuse the previous file's text.
                continue

            # count words

            # spell check
            print(misspelled_words(text))

            # sentence lengths

            # sentence starters


if __name__ == '__main__':
    main()