pdftotext -enc UTF-8 -layout payroll2013.pdf
requires pdftotext from poppler
and this txt file
<a href="" class="toggle"><span class="top"></span><span class="middle"></span><span class="bottom"></span></a> |
UPDATE wp_posts SET ping_status='closed' WHERE post_status = 'publish' AND post_type = 'post'; | |
UPDATE wp_posts SET ping_status='closed' WHERE post_status = 'publish' AND post_type = 'page'; |
<!DOCTYPE html> | |
<meta charset="utf-8"> | |
<style> | |
.schooldistrict { | |
fill: #eee; | |
stroke: #777; | |
} | |
.schooldistrict:hover { | |
fill: steelblue; |
<!DOCTYPE html> | |
<meta charset="utf-8"> | |
<style> | |
.lake { | |
fill: steelblue;; | |
} | |
.river { | |
fill: none; | |
stroke: #777; | |
} |
01C019105 | |
01C022105 | |
01C024105 | |
01C028105 | |
01C029105 | |
01C032105 | |
01I004105 | |
01I004705 | |
01I011105 | |
01I011205 |
import subprocess | |
import glob | |
for file in glob.glob("afgradespdfs/*.pdf"): | |
cmd = 'pdftotext -enc UTF-8 -layout %s' % (file) | |
run = subprocess.Popen(cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE) | |
out, err = run.communicate() | |
# display errors if they occur | |
if err: |
import csv | |
import glob | |
def lineParse(line): | |
return lines[line].strip() | |
def lineSpliceParse(line, start, stop): | |
return str(lines[line].strip()[start:stop]).strip() | |
high = [] |
year | Magnitude-1 | Magnitude-2 | Magnitude-3 | Magnitude-4 | |
---|---|---|---|---|---|
2000 | 8 | 9 | 1 | 0 | |
2001 | 16 | 14 | 0 | 0 | |
2002 | 22 | 17 | 3 | 0 | |
2003 | 22 | 25 | 0 | 0 | |
2004 | 30 | 32 | 2 | 0 | |
2005 | 12 | 7 | 2 | 0 | |
2006 | 6 | 12 | 3 | 0 | |
2007 | 5 | 23 | 1 | 0 | |
2008 | 2 | 20 | 2 | 0 |
<!DOCTYPE html> | |
<meta charset="utf-8"> | |
<style> | |
.schooldistrict { | |
stroke: #000; | |
} | |
.schooldistrictv1, .schooldistrictv2 { | |
opacity: .5; | |
} |