phaneesh/sync-ifsc.py

## sync-ifsc.py
from __future__ import print_function
import requests
from bs4 import BeautifulSoup
import xlrd
import shutil
import os
import codecs

page = requests.get("https://www.rbi.org.in/Scripts/bs_viewcontent.aspx?Id=2009")

soup = BeautifulSoup(page.content, 'html.parser')

ifsc_table = soup.find_all('table', class_='tablebg')[0]

ifsc_links = ifsc_table.find_all('a')


def download_file(url):
    local_filename = url.split('/')[-1]
    print("Downloading file: " + url + " | File Name: " + local_filename)
    r = requests.get(url.replace("http:", "https:"), stream=True)
    with open(local_filename, 'wb') as f:
        shutil.copyfileobj(r.raw, f)

    return local_filename


full_file = codecs.open("all_ifsc.csv", "wb", "utf-8")
error_file = codecs.open("all_ifsc_errors.txt", "wb", "utf-8")

for link in ifsc_links:
    file_path = download_file(link['href'])
    xl = xlrd.open_workbook(file_path)
    df = xl.sheet_by_index(0)
    for row in range(1, df.nrows):
        values = []
        try:
            for c in range(df.ncols):
                values.append(unicode(df.cell_value(row, c)))
            print(",".join(values))
            print(",".join(values), file=full_file)
        except:
            print(df.row(row))
            print(df.row(row), file=error_file)
    os.remove(file_path)

full_file.close()
error_file.close()
	from __future__ import print_function
	import requests
	from bs4 import BeautifulSoup
	import xlrd
	import shutil
	import os
	import codecs

	page = requests.get("https://www.rbi.org.in/Scripts/bs_viewcontent.aspx?Id=2009")

	soup = BeautifulSoup(page.content, 'html.parser')

	ifsc_table = soup.find_all('table', class_='tablebg')[0]

	ifsc_links = ifsc_table.find_all('a')


	def download_file(url):
	local_filename = url.split('/')[-1]
	print("Downloading file: " + url + " \| File Name: " + local_filename)
	r = requests.get(url.replace("http:", "https:"), stream=True)
	with open(local_filename, 'wb') as f:
	shutil.copyfileobj(r.raw, f)

	return local_filename


	full_file = codecs.open("all_ifsc.csv", "wb", "utf-8")
	error_file = codecs.open("all_ifsc_errors.txt", "wb", "utf-8")

	for link in ifsc_links:
	file_path = download_file(link['href'])
	xl = xlrd.open_workbook(file_path)
	df = xl.sheet_by_index(0)
	for row in range(1, df.nrows):
	values = []
	try:
	for c in range(df.ncols):
	values.append(unicode(df.cell_value(row, c)))
	print(",".join(values))
	print(",".join(values), file=full_file)
	except:
	print(df.row(row))
	print(df.row(row), file=error_file)
	os.remove(file_path)

	full_file.close()
	error_file.close()