Ettore Rizza ettorerizza

## marc2csv_mcmaster.py
#!/usr/bin/env python

import csv
from pymarc import MARCReader
from os import listdir
from re import search

# change this line to match your folder structure
SRC_DIR = '/path/to/mrc/records'

## import_viaf.pl
#!/usr/bin/env perl
#
# Match authors against VIAF
#
# License: http://dev.perl.org/licenses/artistic.html
#
# Author: Patrick Hochstenbach <Patrick.Hochstenbach@UGent.be>
#
# Apr 2015
$|++;

## xml_split.py
#!/usr/bin/env python

import os
import xml.parsers.expat
from xml.sax.saxutils import escape
from optparse import OptionParser
from math import log10


# How much data we process at a time

## gist:a54ccefbb1059becd0e4fd41f82bc2be
<qualifieddc xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1" xmlns:dcterms="http://purl.org/dc/terms" xmlns:marcrel="http://www.loc.gov/marc.relators" xsi:schemaLocation="http://www.loc.gov/marc.relators http://imlsdcc2.grainger.illinois.edu/registry/marcrel.xsd" xsi:noNamespaceSchemaLocation="http://dublincore.org/schemas/xmls/qdc/2008/02/11/qualifieddc.xsd">
{{forNonBlank(cells["id"], v, "<dc:identifier>"+v.value+"</dc:identifier>", "")}}
{{forNonBlank(cells["Title"], v, "<dc:title>"+v.value+"</dc:title>", "")}}
{{forNonBlank(cells["Creator"], v, "<dc:creator>"+v.value+"</dc:creator>", "")}}
{{forNonBlank(cells["Date"], v, "<dc:date>"+v.value+"</dc:date>", "")}}
{{forNonBlank(cells["Description"], v, "<dc:description>"+v.value+"</dc:description>", "")}}
{{forNonBlank(cells["Description2"], v, "<dc:description>"+v.value+"</dc:description>", "")}}
{{forNonBlank(cells["Rights"], v, "<dc:rights>"+v.value+"</dc:rights>", "")}}
{{forNonBlank(cells["Type"], v, "<dc:

## airbnb.r
library(stringr)
library(purrr)
library(rvest)

#------------------------------------------------------------------------------#
# Author: Andrew Do
# Purpose: A bunch of utility functions for the main ScrapeCityToPage. The goal
# is to be able to scrape up to a specified page number for a given city and
# then to store that information as a data frame.  The resulting data frame will
# be raw and will require additional cleaning, but the structure is more or less
	#!/usr/bin/env python

	import csv
	from pymarc import MARCReader
	from os import listdir
	from re import search

	# change this line to match your folder structure
	SRC_DIR = '/path/to/mrc/records'
	#!/usr/bin/env perl
	#
	# Match authors against VIAF
	#
	# License: http://dev.perl.org/licenses/artistic.html
	#
	# Author: Patrick Hochstenbach <Patrick.Hochstenbach@UGent.be>
	#
	# Apr 2015
	$|++;
	#!/usr/bin/env python

	import os
	import xml.parsers.expat
	from xml.sax.saxutils import escape
	from optparse import OptionParser
	from math import log10


	# How much data we process at a time
	<qualifieddc xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1" xmlns:dcterms="http://purl.org/dc/terms" xmlns:marcrel="http://www.loc.gov/marc.relators" xsi:schemaLocation="http://www.loc.gov/marc.relators http://imlsdcc2.grainger.illinois.edu/registry/marcrel.xsd" xsi:noNamespaceSchemaLocation="http://dublincore.org/schemas/xmls/qdc/2008/02/11/qualifieddc.xsd">
	{{forNonBlank(cells["id"], v, "<dc:identifier>"+v.value+"</dc:identifier>", "")}}
	{{forNonBlank(cells["Title"], v, "<dc:title>"+v.value+"</dc:title>", "")}}
	{{forNonBlank(cells["Creator"], v, "<dc:creator>"+v.value+"</dc:creator>", "")}}
	{{forNonBlank(cells["Date"], v, "<dc:date>"+v.value+"</dc:date>", "")}}
	{{forNonBlank(cells["Description"], v, "<dc:description>"+v.value+"</dc:description>", "")}}
	{{forNonBlank(cells["Description2"], v, "<dc:description>"+v.value+"</dc:description>", "")}}
	{{forNonBlank(cells["Rights"], v, "<dc:rights>"+v.value+"</dc:rights>", "")}}
	{{forNonBlank(cells["Type"], v, "<dc:
	library(stringr)
	library(purrr)
	library(rvest)

	#------------------------------------------------------------------------------#
	# Author: Andrew Do
	# Purpose: A bunch of utility functions for the main ScrapeCityToPage. The goal
	# is to be able to scrape up to a specified page number for a given city and
	# then to store that information as a data frame. The resulting data frame will
	# be raw and will require additional cleaning, but the structure is more or less