# NbtKmy/check_gnd.py

## check_gnd.py
import pandas as pd
import requests

# Look up the people listed in snf_person.csv in the lobid-gnd search API and
# record, per row, the matching GND id plus any VIAF / ORCID links the GND
# record carries.  The annotated rows are written to snf_checkedGND.csv.

INPUT_CSV = 'snf_person.csv'
OUTPUT_CSV = 'snf_checkedGND.csv'
MAX_ROWS = 100  # only the first MAX_ROWS rows of the input are looked up

GND_SEARCH_URL = 'https://lobid.org/gnd/search'
REQUEST_TIMEOUT = 30  # seconds; keeps one stalled request from hanging the run

# ``sameAs[].collection.id`` values whose entries are stored in the 'viaf'
# and 'orcid_gnd' output columns respectively.
VIAF_COLLECTION_ID = 'http://www.wikidata.org/entity/Q54919'
ORCID_COLLECTION_ID = 'https://orcid.org'

INSTITUTE_COLUMN = 'Institute Name'
LABEL_SEPARATOR = '; '


def _external_ids(person):
    """Return the VIAF / ORCID links of one GND record.

    The result maps the output column name ('viaf', 'orcid_gnd') to the id of
    the matching ``sameAs`` entry; a key is absent when the record has no such
    entry.
    """
    found = {}
    for other_ent in person.get('sameAs', []):
        collection_id = other_ent.get('collection', {}).get('id')
        if collection_id == VIAF_COLLECTION_ID:
            found['viaf'] = other_ent['id']
        elif collection_id == ORCID_COLLECTION_ID:
            found['orcid_gnd'] = other_ent['id']
    return found


def _is_affiliated_with(person, institute):
    """Return True if any affiliation label of the record equals ``institute``."""
    return any(
        affis.get('label') == institute
        for affis in person.get('affiliation', [])
    )


def _append_labels(existing, labels):
    """Join ``labels`` onto an existing cell value, separated by '; '.

    A non-string or empty ``existing`` (e.g. the NaN pandas uses for an empty
    cell) is treated as "nothing there yet" instead of raising on ``+=``.
    """
    parts = [existing] if isinstance(existing, str) and existing else []
    parts.extend(labels)
    return LABEL_SEPARATOR.join(parts)


def resolve_gnd_match(gnd_dat, inst, current_institute=None):
    """Translate one lobid-gnd search response into column updates for a row.

    Parameters:
        gnd_dat: decoded JSON of the search response; the keys read are
            'totalItems' and 'member'.
        inst: institute name of the person being looked up.
        current_institute: present content of the row's 'Institute Name'
            cell, used when affiliation labels are appended to it.

    Returns:
        A dict mapping column name to new value.  It is empty when the
        response is empty, has no hits, or has several hits none of which is
        affiliated with ``inst``.

        * Several hits: every hit with an affiliation label equal to ``inst``
          contributes 'gnd' and its VIAF / ORCID links; later hits overwrite
          earlier ones.
        * Exactly one hit: it is accepted without an affiliation check and
          flagged with ``ambiguity = 50``; its affiliation labels are
          appended to the institute cell and its VIAF / ORCID links recorded.
    """
    if not gnd_dat:
        return {}

    total = gnd_dat.get('totalItems', 0)
    members = gnd_dat.get('member', [])
    updates = {}

    if total > 1:
        for pers in members:
            if _is_affiliated_with(pers, inst):
                updates['gnd'] = pers['id']
                updates.update(_external_ids(pers))
    elif total == 1 and members:
        # 'member' is a list even for a single hit; the record itself is its
        # first element, so the affiliation / sameAs lookups go through it.
        pers = members[0]
        updates['gnd'] = pers['id']
        updates['ambiguity'] = 50

        labels = [
            affis['label']
            for affis in pers.get('affiliation', [])
            if 'label' in affis
        ]
        if labels:
            updates[INSTITUTE_COLUMN] = _append_labels(current_institute, labels)

        updates.update(_external_ids(pers))

    return updates


def _search_gnd(name):
    """Query lobid-gnd for persons matching ``name`` and return the JSON body.

    The query is passed via ``params`` so that requests URL-encodes the name;
    characters such as '&' or '#' in a name would otherwise corrupt the query
    string.  Raises ``requests.RequestException`` on transport or HTTP errors
    and ``ValueError`` if the body is not valid JSON.
    """
    response = requests.get(
        GND_SEARCH_URL,
        params={'q': name, 'filter': 'type:Person', 'format': 'json'},
        timeout=REQUEST_TIMEOUT,
    )
    response.raise_for_status()
    return response.json()


def main():
    """Annotate the first MAX_ROWS rows of the input CSV and write the result."""
    df = pd.read_csv(INPUT_CSV, sep=',')

    # The literal string 'NaN' (not a float NaN) marks "nothing found".
    df['viaf'] = 'NaN'
    df['orcid_gnd'] = 'NaN'
    df['gnd'] = 'NaN'
    df['ambiguity'] = 0

    # Explicit copy: the rows are modified below, and writing into a bare
    # slice of ``df`` is ambiguous in pandas (SettingWithCopyWarning).
    df1 = df[:MAX_ROWS].copy()

    for index, row in df1.iterrows():
        # Columns are addressed by position: 0 = last name, 1 = first name,
        # 3 = institute.  ``.iloc`` makes that explicit instead of relying on
        # the deprecated positional fallback of ``row[0]``.
        name = '{}, {}'.format(row.iloc[0], row.iloc[1])
        inst = row.iloc[3]

        try:
            gnd_dat = _search_gnd(name)
        except (requests.RequestException, ValueError) as err:
            # One failed lookup should not discard the rows already done;
            # report it and leave this row with its placeholder values.
            print('GND lookup failed for {!r}: {}'.format(name, err))
            continue

        updates = resolve_gnd_match(gnd_dat, inst, row.get(INSTITUTE_COLUMN))
        for column, value in updates.items():
            df1.at[index, column] = value

    df1.to_csv(OUTPUT_CSV)


if __name__ == '__main__':
    main()