Skip to content

Instantly share code, notes, and snippets.

@mrmiguez
Created February 17, 2022 17:19
Show Gist options
  • Save mrmiguez/eea788e03b23e8b44657ee628737f5f7 to your computer and use it in GitHub Desktop.
Save mrmiguez/eea788e03b23e8b44657ee628737f5f7 to your computer and use it in GitHub Desktop.
from collections import namedtuple
# One record per data provider.
#   code     -- short provider identifier; identical to the provider's key
#               in OAI_DICT.
#   oai_url  -- URL of the provider's OAI endpoint.
#   mdprefix -- metadata prefix string requested from that endpoint
#               (values used below: oai_dc, oai_qdc, qdc, mods,
#               simple-dublin-core).
#   oai_sets -- list of set identifiers associated with the provider.
# NOTE(review): field meanings are inferred from the names and the values
# stored below -- confirm against the code that consumes OAI_DICT.
DataProvider = namedtuple('DataProvider', 'code oai_url mdprefix oai_sets')

# Registry of providers, keyed by provider code. Insertion order is kept
# exactly as it was in case a consumer iterates the dict in order.
OAI_DICT = {
    'boynton': DataProvider(
        'boynton',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['boy'],
    ),
    'brockway': DataProvider(
        'brockway',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['bml'],
    ),
    'broward': DataProvider(
        'broward',
        'https://broward.digital.flvc.org/oai2',
        'mods',
        [
            'broward_scrapbcol', 'broward_thumacol',
            'broward_ephemera', 'broward_55',
            'broward_butterflycol', 'broward_pankucol',
            'broward_theobservercol', 'broward_phoenix',
            'broward_venetiancrier', 'broward_newhorizons',
            'broward_polaris',
        ],
    ),
    'comb': DataProvider(
        'comb',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['imbda'],
    ),
    'coral_gables': DataProvider(
        'coral_gables',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['cgm'],
    ),
    'fau': DataProvider(
        'fau',
        'https://fau.digital.flvc.org/oai2',
        'mods',
        [
            'fau_kemery', 'fau_ycb', 'fau_floridabooks',
            'fau_allweiner', 'fau_depthistory',
        ],
    ),
    'fgcu': DataProvider(
        'fgcu',
        'https://fgcu.digital.flvc.org/oai2',
        'mods',
        [
            'fgcu_020306', 'fgcu_0217', 'fgcu_0215', 'fgcu_0216',
            'fgcu_blackhistorysociety', 'fgcu_020302',
            'fgcu_020301',
        ],
    ),
    'mbvm': DataProvider(
        'mbvm',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['mbvm'],
    ),
    'fiu': DataProvider(
        'fiu',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        [
            'bzs', 'doc', 'fls', 'glows', 'iif', 'lgcf', 'llsm',
            'lter', 'mca', 'phc', 'ps', 'rte', 'serc', 'sfnrc',
            'sfwmd', 'spc', 'two', 'ua', 'vms', 'zoo',
        ],
    ),
    'fscj': DataProvider(
        'fscj',
        'https://fscj.digital.flvc.org/oai2',
        'mods',
        [
            'fscj_164', 'fscj_alpha', 'fscj_3', 'fscj_59329',
            'fscj_13557', 'fscj_59223', 'fscj_collegehistory',
            'fscj_33058', 'fscj_orionis', 'fscj_athletics',
            'fscj_danceworks', 'fscj_dramaWORKS',
            'fscj_studentresearchconference',
            'fscj_summermusicaltheatreexperience', 'fscj_band',
        ],
    ),
    'fsu': DataProvider(
        'fsu',
        'https://diginole.lib.fsu.edu/oai2',
        'mods',
        ['fsu_digital_library'],
    ),
    'gnmhs': DataProvider(
        'gnmhs',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['ignmhs'],
    ),
    'hialeah': DataProvider(
        'hialeah',
        'http://cdm17339.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        ['p17339coll1'],
    ),
    'hmm': DataProvider(
        'hmm',
        'http://cdm17191.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        ['hmm0001'],
    ),
    'ir_fiu': DataProvider(
        'ir_fiu',
        'https://digitalcommons.fiu.edu/do/oai/',
        'qdc',
        ['publication:dpla_harvest'],
    ),
    'leesburg': DataProvider(
        'leesburg',
        'http://cdm16937.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        [
            'p16937coll2', 'p16937coll3', 'p16937coll7',
            'p16937coll6',
        ],
    ),
    'mcpl': DataProvider(
        'mcpl',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['mile'],
    ),
    'mdpl': DataProvider(
        'mdpl',
        'http://cdm17273.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        [
            'p17273coll9', 'p17273coll8', 'p17273coll7',
            'p17273coll6', 'p17273coll5', 'p17273coll4',
            'p17273coll3', 'p17273coll2', 'p17273coll18',
            'p17273coll17', 'p17273coll16', 'p17273coll15',
            'p17273coll13', 'p17273coll11', 'p17273coll10',
            'p17273coll1', 'p17273coll19', 'p17273coll14',
            'p17273coll23', 'p17273coll20', 'p17273coll12',
            'p17273coll24', 'p17273coll25', 'p17273coll22',
            'p17273coll26', 'p17273coll27',
        ],
    ),
    'ringling': DataProvider(
        'ringling',
        'https://diginole.lib.fsu.edu/oai2',
        'mods',
        ['fsu_ringlingmain'],
    ),
    'um': DataProvider(
        'um',
        'http://cdm17191.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        [
            'chc5314', 'arc5100', 'arc5200', 'arc5300',
            'arcdigital', 'asm0015', 'asm0034', 'asm0037',
            'asm0038', 'asm0055', 'asm0060', 'asm0075', 'asm0085',
            'asm0179', 'asm0216', 'asm0261', 'asm0286', 'asm0299',
            'asm0300', 'asm0301', 'asm0304', 'asm0341', 'asm0344',
            'asm0383', 'asm0400', 'asm0409', 'asm0410', 'asm0447',
            'asm0471', 'asm0480', 'asm0491', 'asm0530', 'asm0566',
            'asm0567', 'asm0569', 'asm0570', 'asm0610', 'asm0636',
            'asm0650', 'asm0655', 'asm0656', 'asm0700', 'asm0713',
            'asm0717', 'asm5000', 'asu0010', 'asu0017', 'asu0058',
            'asu0281', 'asu0651', 'asu0654', 'chc0015', 'chc0111',
            'chc0124', 'chc0126', 'chc0170', 'chc0184', 'chc0189',
            'chc0193', 'chc0218', 'chc0219', 'chc0336', 'chc0339',
            'chc0347', 'chc0356', 'chc0359', 'chc0364', 'chc0380',
            'chc0398', 'chc0400', 'chc0460', 'chc0468', 'chc0484',
            'chc0487', 'chc5006', 'chc5010', 'chc5017', 'chc5047',
            'chc5061', 'chc5066', 'chc5122', 'chc5123', 'chc5143',
            'chc5209', 'chc5212', 'chc5223', 'chc5252', 'chc5260',
            'chc5277', 'chc5278', 'chc5298', 'chc5299', 'chc5312',
            'chc5313', 'chc5324', 'chc5352', 'chc5372', 'chc5376',
            'chc9999', 'cubanlaw', 'cubanphotos', 'dplaper',
            'asm0033', 'pamphlets', 'asm0157', 'rsmasphotos',
            'chc5293', 'asc9999', 'sutherland', 'swingle',
            'theater', 'tobaccoart', 'umphotos', 'asm0188',
        ],
    ),
    'unf': DataProvider(
        'unf',
        'https://digitalcommons.unf.edu/do/oai',
        # The comma after the prefix is required: without it the list
        # below is parsed as a subscript on the string and raises
        # TypeError when the module is imported.
        'simple-dublin-core',
        [
            'publication:archbishoptutupapers',
            'publication:absmithletters', 'publication:solleetext',
            'publication:eartha_books', 'publication:eartha_audio',
            'publication:eartha_materials', 'publication:halyard',
            'publication:rthomas', 'publication:yearbooks',
            'publication:sollee', 'publication:johnston_text',
            'publication:aalic', 'publication:abt',
            'publication:eartha_images',
        ],
    ),
    'usf': DataProvider(
        'usf',
        'https://digital.lib.usf.edu/SobekCM_oai.aspx',
        'oai_dc',
        [
            'cape-canaveral-3d', 'hadobson-papers', 'ohp-ybor',
            'snaps', 'alicia', 'allsportslibrary', 'yorkunas',
            'americanindianweekly', 'slaymakera',
            'army-navy-weekly', 'elaudaz', 'audubonfl',
            'tavernier', 'beadle-boys', 'brahman', 'braveandbold',
            'buffalobillstories', 'burgert', 'ohp-carltonanthony',
            'catesby', 'ohp-celtic', 'cedr',
            'centroasturiano-mbrs', 'ringlingfamily',
            'childrens-lit', 'fl-local-histories',
            'columbia-gonzmart', 'ohp-columbia', 'ohp-liberators',
            'cubanrevolutionaries', 'his-dave-porter',
            'deadwooddicklibrary', 'diamonddickjr', 'ladifesa',
            'boucicault', 'disparo', 'bentz', 'echoes', 'wagner',
            'maps-early', 'ensminger', 'elapp', 'ohp-elapp',
            'exlibris', 'eyeofthebeast', 'fame-fortune-weekly',
            'karam', 'fccdrc', 'fcst', 'ohp-flcitrus',
            'ohp-flcivilright', 'ohp-flfoodfamilies',
            'johnscommittee', 'fl-libraryhistory', 'maps-florida',
            'ohp-coph', 'fl-sentinel', 'fl-slavenarratives',
            'fmhi-lectures', 'thompsonpapers', 'frankreadelibrary',
            'lagaceta', 'whitecartoons', 'gordonkellernursing',
            'arch-stpete-parks', 'huaca-soto', 'karst',
            'ohp-karst', 'naturalhazardscenter', 'davis',
            'rpallen', 'mvi-sustainfutures', 'ohp-tampabayestuary',
            'usf-paleontology', 'graber', 'dunn-postcards',
            'dunn-photouring', 'hillsboroughmarriage',
            'hc-tampa-maps', 'hillsboroughnatural', 'hipple',
            'ybor-walkingtour', 'ohp-holocaustsurvive',
            'irish-studies', 'jessejamesstories',
            'jwegerton-papers', 'korad', 'legioniefalangi',
            'lemur', 'lgbt', 'ohp-lgbt', 'libertyboys', 'buck',
            # 'naturalhazardscenter' used to be repeated here; it is
            # already listed above, so the duplicate was dropped.
            'nickcarterweekly',
            'ohp-oculina', 'old-cap-collier', 'oldsleuth',
            'oracle', 'osterweil', 'oteroycolominas',
            'ohp-otisanthony', 'pluckandluck', 'qubit',
            'larevista', 'maniscalcor', 'helps-robert',
            'robertsonandfresh', 'pagan-shrine',
            'sacred-leaves-sympos', 'sacred-leaves-manusc',
            'sallybirdhowry', 'watt', 'zylstra', 'scifi',
            'secretservice-bradys', 'sfra-newsletter',
            'shieldweekly', 'showmens', 'ohp-showmens',
            'skip-gandy', 'spanishcivilwar', 'ohp-spanishcivilwar',
            'starryflagweekly', 'mvi-stateofwater', 'stokes',
            'ohp-sulphursprings', 'suniland', 'sunland-tribune',
            'ohp-tampaarts', 'tampabayhistoryjrnl', 'cigars',
            'tampailustrado', 'tampa-life', 'ohp-freedman',
            'tampanativesshow', 'wpa-papers', 'latinoperiodicals',
            't-terrace-sentinel', 'trse', 'tiptopweekly',
            'tobaccoleafjournal', 'mvi-tropicalecology',
            'tyndalltarget', 'ohp-usf25', 'ohp-usf50',
            'usf-archives', 'accent-on-learning', 'cota',
            'ohp-csd50th', 'usf-fact-book', 'usf-liblectures',
            'ohp-usfhistory', 'usfphotos', 'usf-student-news',
            'usfwomen', 'usf-yearbooks', 'cutr', 'jsallen-papers',
            'volcanic-lightning', 'darfuridrawings', 'wehman',
            'ohp-westcentralfl', 'wide-awake-weekly',
            'wildwestweekly', 'yankeedoodle', 'youngklondike',
            'youngroughriders', 'progress-village',
        ],
    ),
    'vhlf': DataProvider(
        'vhlf',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['hco'],
    ),
}

# Filesystem path with a trailing slash.
# NOTE(review): presumably the directory that exported OAI data is written
# to -- confirm against the code that reads OUT_PATH.
OUT_PATH = '/opt/ssdn/OAI_export/'
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment