# sithart/bioinformatics_keywords_scraping.py

## bioinformatics_keywords_scraping.py
import requests
from bs4 import BeautifulSoup
import json
import csv


import pandas as pd
# Page that holds the bioinformatics glossary to scrape.
GLOSSARY_URL = "https://mipt.ru/dbmp/student/files/bioinformatics/books/glossary_bioinf.php"
# File that receives the scraped glossary as JSON.
OUTPUT_PATH = 'Glossary_of_info.txt'
# Upper bound for the HTTP request so a stalled server cannot hang the script.
REQUEST_TIMEOUT_SECONDS = 30


def clean_definition(term: str, container_text: str) -> str:
    """Return *container_text* without its heading *term* and without newlines.

    Only the first occurrence of *term* is removed (presumably the glossary
    heading itself), so a definition that mentions its own term again keeps
    that later mention intact.

    Args:
        term: Text of the glossary entry.
        container_text: Full text of the element holding the entry and its
            definition.

    Returns:
        The definition text with the first *term* and every newline removed.
    """
    return container_text.replace(term, '', 1).replace('\n', '')


def extract_entries(soup):
    """Collect glossary terms and their definitions from a parsed page.

    A term is the text of each ``<span class="entry">`` element; its
    definition is the text of that span's grandparent element, cleaned with
    ``clean_definition``.

    Args:
        soup: Parsed document exposing ``find_all`` (a ``BeautifulSoup``
            object in this script).

    Returns:
        A ``(keys, values)`` pair of equally long lists, in document order.
    """
    keys = []
    values = []
    for data in soup.find_all("span", attrs={"class": "entry"}):
        key = data.get_text()
        keys.append(key)
        values.append(clean_definition(key, data.parent.parent.get_text()))
    return keys, values


def main() -> None:
    """Download the glossary page and write it to ``OUTPUT_PATH`` as JSON.

    Prints the number of definitions and the number of terms found.

    Raises:
        requests.HTTPError: If the server answers with an error status.
    """
    res = requests.get(GLOSSARY_URL, timeout=REQUEST_TIMEOUT_SECONDS)
    # Fail loudly instead of parsing an error page into an empty glossary.
    res.raise_for_status()
    soup = BeautifulSoup(res.text, "html.parser")

    keys, values = extract_entries(soup)
    print(len(values))
    print(len(keys))

    # A term that occurs more than once keeps only its last definition.
    dictionary = dict(zip(keys, values))
    with open(OUTPUT_PATH, 'w', encoding='utf-8') as json_file:
        json.dump(dictionary, json_file, indent=4)


if __name__ == "__main__":
    main()