Skip to content

Instantly share code, notes, and snippets.

@mrmiguez
Created January 28, 2021 23:31
Show Gist options
  • Save mrmiguez/ebe2c320bc7f2f626245265fd8bcf122 to your computer and use it in GitHub Desktop.
Save mrmiguez/ebe2c320bc7f2f626245265fd8bcf122 to your computer and use it in GitHub Desktop.
from collections import namedtuple
# Record describing one harvest source.
#   code     -- short provider identifier; in every entry below it is the
#               same string as the entry's key in OAI_DICT
#   oai_url  -- URL of the provider's OAI endpoint
#   mdprefix -- metadata format name (presumably sent as the OAI-PMH
#               ``metadataPrefix`` argument -- confirm against the harvester)
#   oai_sets -- list of set identifiers configured for this provider
DataProvider = namedtuple('DataProvider', 'code oai_url mdprefix oai_sets')

# Registry of harvest sources keyed by provider code.
# Several providers share a single endpoint and differ only in their sets.
# Set identifiers must be unique within a provider: a repeated identifier
# would make any consumer that walks ``oai_sets`` process that set twice.
OAI_DICT = {
    'boynton': DataProvider(
        'boynton',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['boy'],
    ),
    'brockway': DataProvider(
        'brockway',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['bml'],
    ),
    'broward': DataProvider(
        'broward',
        'https://broward.digital.flvc.org/oai2',
        'mods',
        [
            'broward_scrapbcol', 'broward_thumacol',
            'broward_ephemera', 'broward_55',
            'broward_butterflycol', 'broward_pankucol',
            'broward_theobservercol',
        ],
    ),
    'coral_gables': DataProvider(
        'coral_gables',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['cgm'],
    ),
    'fau': DataProvider(
        'fau',
        'https://fau.digital.flvc.org/oai2',
        'mods',
        ['fau_kemery', 'fau_ycb', 'fau_floridabooks', 'fau_allweiner'],
    ),
    'fgcu': DataProvider(
        'fgcu',
        'https://fgcu.digital.flvc.org/oai2',
        'mods',
        [
            'fgcu_020306', 'fgcu_0217', 'fgcu_0215', 'fgcu_0216',
            'fgcu_blackhistorysociety', 'fgcu_020302',
            'fgcu_020301',
        ],
    ),
    'mbvm': DataProvider(
        'mbvm',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['mbvm'],
    ),
    'fiu': DataProvider(
        'fiu',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        [
            'bzs', 'doc', 'fls', 'glows', 'iif', 'lgcf', 'llsm',
            'lter', 'mca', 'phc', 'ps', 'rte', 'serc', 'sfnrc',
            'sfwmd', 'spc', 'two', 'ua', 'vms', 'zoo',
        ],
    ),
    'fscj': DataProvider(
        'fscj',
        'https://fscj.digital.flvc.org/oai2',
        'mods',
        [
            'fscj_164', 'fscj_alpha', 'fscj_3', 'fscj_59329',
            'fscj_13557', 'fscj_59223', 'fscj_collegehistory',
            'fscj_33058', 'fscj_orionis', 'fscj_athletics',
            'fscj_danceworks', 'fscj_dramaWORKS',
            'fscj_studentresearchconference',
        ],
    ),
    'fsu': DataProvider(
        'fsu',
        'https://fsu.digital.flvc.org/oai2',
        'mods',
        ['fsu_digital_library'],
    ),
    'gnmhs': DataProvider(
        'gnmhs',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['ignmhs'],
    ),
    'hialeah': DataProvider(
        'hialeah',
        'http://cdm17339.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        ['p17339coll1'],
    ),
    'hmm': DataProvider(
        'hmm',
        'http://cdm17191.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        ['hmm0001'],
    ),
    'ir_fiu': DataProvider(
        'ir_fiu',
        'https://digitalcommons.fiu.edu/do/oai/',
        'qdc',
        [
            'publication:chue_archive', 'publication:crivideo',
            'publication:cuba_poll', 'publication:ecohumanities',
            'publication:ecohumanities_images',
            'publication:economics_ops', 'publication:economics_wps',
            'publication:ecxdpeb', 'publication:etd',
            'publication:fce_lter_photos',
            'publication:fce_lter_proposals_reports',
            'publication:fiu_images', 'publication:fiu_video',
            'publication:fiuinview', 'publication:frostcatalogs',
            'publication:laccops', 'publication:laccopsd',
            'publication:laccwps', 'publication:mpo_broward',
            'publication:mpo_dade', 'publication:mpo_palmbeach',
            'publication:research_reports', 'publication:sercrp',
            'publication:serials', 'publication:sgabbc_images',
            'publication:spain_videos', 'publication:theatre_images',
            'publication:theatre_posters',
            'publication:theatre_programs', 'publication:yearbooks',
        ],
    ),
    'mcpl': DataProvider(
        'mcpl',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['mile'],
    ),
    'mdpl': DataProvider(
        'mdpl',
        'http://cdm17273.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        [
            'p17273coll9', 'p17273coll8', 'p17273coll7',
            'p17273coll6', 'p17273coll5', 'p17273coll4',
            'p17273coll3', 'p17273coll2', 'p17273coll18',
            'p17273coll17', 'p17273coll16', 'p17273coll15',
            'p17273coll13', 'p17273coll11', 'p17273coll10',
            'p17273coll1', 'p17273coll19', 'p17273coll14',
            'p17273coll23', 'p17273coll20', 'p17273coll12',
            'p17273coll24',
        ],
    ),
    'um': DataProvider(
        'um',
        'http://cdm17191.contentdm.oclc.org/oai/oai.php',
        'oai_qdc',
        [
            'chc5314', 'arc5100', 'arc5200', 'arc5300',
            'arcdigital', 'asm0015', 'asm0034', 'asm0037', 'asm0038',
            'asm0055', 'asm0060', 'asm0075', 'asm0085', 'asm0179',
            'asm0216', 'asm0261', 'asm0286', 'asm0299', 'asm0300',
            'asm0301', 'asm0304', 'asm0341', 'asm0344', 'asm0383',
            'asm0400', 'asm0409', 'asm0410', 'asm0447', 'asm0471',
            'asm0480', 'asm0491', 'asm0530', 'asm0566', 'asm0567',
            'asm0569', 'asm0570', 'asm0610', 'asm0636', 'asm0650',
            'asm0655', 'asm0656', 'asm0700', 'asm0713', 'asm0717',
            'asm5000', 'asu0010', 'asu0017', 'asu0058', 'asu0281',
            'asu0651', 'asu0654', 'chc0015', 'chc0111', 'chc0124',
            'chc0126', 'chc0170', 'chc0184', 'chc0189', 'chc0193',
            'chc0218', 'chc0219', 'chc0336', 'chc0339', 'chc0347',
            'chc0356', 'chc0359', 'chc0364', 'chc0380', 'chc0398',
            'chc0400', 'chc0460', 'chc0468', 'chc0484', 'chc0487',
            'chc5006', 'chc5010', 'chc5017', 'chc5047', 'chc5061',
            'chc5066', 'chc5122', 'chc5123', 'chc5143', 'chc5209',
            'chc5212', 'chc5223', 'chc5252', 'chc5260', 'chc5277',
            'chc5278', 'chc5298', 'chc5299', 'chc5312', 'chc5313',
            'chc5324', 'chc5352', 'chc5372', 'chc5376', 'chc9999',
            'cubanlaw', 'cubanphotos', 'dplaper', 'asm0033',
            'pamphlets', 'asm0157', 'rsmasphotos', 'chc5293',
            'asc9999', 'sutherland', 'swingle', 'theater',
            'tobaccoart', 'umphotos', 'asm0188',
        ],
    ),
    'unf': DataProvider(
        'unf',
        'https://digitalcommons.unf.edu/do/oai',
        'simple-dublin-core',
        [
            'publication:archbishoptutupapers',
            'publication:absmithletters', 'publication:solleetext',
            'publication:eartha_books', 'publication:eartha_audio',
            'publication:eartha_materials', 'publication:halyard',
            'publication:rthomas', 'publication:yearbooks',
        ],
    ),
    'usf': DataProvider(
        'usf',
        'https://digital.lib.usf.edu/SobekCM_oai.aspx',
        'oai_dc',
        [
            'cape-canaveral-3d', 'hadobson-papers', 'ohp-ybor',
            'snaps', 'alicia', 'allsportslibrary', 'yorkunas',
            'americanindianweekly', 'slaymakera', 'army-navy-weekly',
            'elaudaz', 'audubonfl', 'tavernier', 'beadle-boys',
            'brahman', 'braveandbold', 'buffalobillstories',
            'burgert', 'ohp-carltonanthony', 'catesby', 'ohp-celtic',
            'cedr', 'centroasturiano-mbrs', 'ringlingfamily',
            'childrens-lit', 'fl-local-histories', 'columbia-gonzmart',
            'ohp-columbia', 'ohp-liberators', 'cubanrevolutionaries',
            'his-dave-porter', 'deadwooddicklibrary', 'diamonddickjr',
            'ladifesa', 'boucicault', 'disparo', 'bentz', 'echoes',
            'wagner', 'maps-early', 'ensminger', 'elapp', 'ohp-elapp',
            'exlibris', 'eyeofthebeast', 'fame-fortune-weekly',
            'karam', 'fccdrc', 'fcst', 'ohp-flcitrus',
            'ohp-flcivilright', 'ohp-flfoodfamilies', 'johnscommittee',
            'fl-libraryhistory', 'maps-florida', 'ohp-coph',
            'fl-sentinel', 'fl-slavenarratives', 'fmhi-lectures',
            'thompsonpapers', 'frankreadelibrary', 'lagaceta',
            'whitecartoons', 'gordonkellernursing',
            'arch-stpete-parks', 'huaca-soto', 'karst', 'ohp-karst',
            'naturalhazardscenter', 'davis', 'rpallen',
            'mvi-sustainfutures', 'ohp-tampabayestuary',
            'usf-paleontology', 'graber', 'dunn-postcards',
            'dunn-photouring', 'hillsboroughmarriage',
            'hc-tampa-maps', 'hillsboroughnatural', 'hipple',
            'ybor-walkingtour', 'ohp-holocaustsurvive',
            'irish-studies', 'jessejamesstories', 'jwegerton-papers',
            'korad', 'legioniefalangi', 'lemur', 'lgbt', 'ohp-lgbt',
            # 'naturalhazardscenter' used to be repeated after 'buck';
            # the first occurrence above is the one that is kept.
            'libertyboys', 'buck',
            'nickcarterweekly', 'ohp-oculina', 'old-cap-collier',
            'oldsleuth', 'oracle', 'osterweil', 'oteroycolominas',
            'ohp-otisanthony', 'pluckandluck', 'qubit', 'larevista',
            'maniscalcor', 'helps-robert', 'robertsonandfresh',
            'pagan-shrine', 'sacred-leaves-sympos',
            'sacred-leaves-manusc', 'sallybirdhowry', 'watt',
            'zylstra', 'scifi', 'secretservice-bradys',
            'sfra-newsletter', 'shieldweekly', 'showmens',
            'ohp-showmens', 'skip-gandy', 'spanishcivilwar',
            'ohp-spanishcivilwar', 'starryflagweekly',
            'mvi-stateofwater', 'stokes', 'ohp-sulphursprings',
            'suniland', 'sunland-tribune', 'ohp-tampaarts',
            'tampabayhistoryjrnl', 'cigars', 'tampailustrado',
            'tampa-life', 'ohp-freedman', 'tampanativesshow',
            'wpa-papers', 'latinoperiodicals', 't-terrace-sentinel',
            'trse', 'tiptopweekly', 'tobaccoleafjournal',
            'mvi-tropicalecology', 'tyndalltarget', 'ohp-usf25',
            'ohp-usf50', 'usf-archives', 'accent-on-learning',
            'cota', 'ohp-csd50th', 'usf-fact-book', 'usf-liblectures',
            'ohp-usfhistory', 'usfphotos', 'usf-student-news',
            'usfwomen', 'usf-yearbooks', 'cutr', 'jsallen-papers',
            'volcanic-lightning', 'darfuridrawings', 'wehman',
            'ohp-westcentralfl', 'wide-awake-weekly',
            'wildwestweekly', 'yankeedoodle', 'youngklondike',
            'youngroughriders',
        ],
    ),
    'vhlf': DataProvider(
        'vhlf',
        'http://dpanther.fiu.edu/sobek/sobekcm_oai.aspx',
        'oai_dc',
        ['hco'],
    ),
}
# Absolute directory path (note the trailing slash), hard-coded for the
# deployment host. Presumably where harvested OAI records are written --
# nothing in this file reads it, so confirm against the consuming script.
OUT_PATH = '/opt/ssdn/OAI_export/'
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment