Skip to content

Instantly share code, notes, and snippets.

Created April 5, 2023 12:54
Show Gist options
  • Save melihme/cb5769c8b9683ff5a1b6849c56adbdc6 to your computer and use it in GitHub Desktop.
Save melihme/cb5769c8b9683ff5a1b6849c56adbdc6 to your computer and use it in GitHub Desktop.
Kandilli Deprem Verisi İndirme
import os
import multiprocessing
from time import sleep
import requests
# Directory the monthly XML files are written to.
download_path = "./data5"
start_year = 2013
end_year = 2023  # inclusive; data for this year is partial until the year has ended
years = range(start_year, end_year + 1)
months = range(1, 13)

# Create the target directory up front. exist_ok=True replaces the separate
# os.path.exists() check and avoids the check-then-create race.
os.makedirs(download_path, exist_ok=True)

# One entry per (year, month), named YYYYMM.xml.
# NOTE(review): the f-string below holds only the file name; no scheme/host
# prefix is visible in this copy of the script, and requests cannot fetch a
# bare file name. Confirm the data source's base URL and prepend it here.
urls = []
for y in years:
    for m in months:
        url_tpl = f"{y}{m:02}.xml"
        urls.append(url_tpl)
def download(url: str, base_path=".", timeout=30):
    """Fetch *url* and save the response body under *base_path*.

    The local file is named after the last ``/``-separated segment of the URL.

    Args:
        url: Address of the file to fetch.
        base_path: Directory to write into; it must already exist.
        timeout: Seconds to wait for the server before giving up, so a
            stalled connection cannot block the whole batch.

    Returns:
        ``"Download successful"`` when the body was fetched and written,
        ``"Download failed"`` on a non-200 status or any error.
    """
    rfile = url.split("/")[-1]
    file_name = os.path.join(base_path, rfile)
    try:
        response = requests.get(url, timeout=timeout)
        if response.status_code != 200:
            print(f"{url} returns {response.status_code}")
            return "Download failed"
        # Write the raw bytes: XML declares its own encoding, so decoding and
        # re-encoding with the platform default could corrupt the file.
        with open(file_name, "wb") as f:
            f.write(response.content)
    except Exception as e:
        # Deliberately broad: one bad month must not abort the whole batch.
        print(f"{url} failed: {e}")
        return "Download failed"
    print(f"{url} is downloaded")
    return "Download successful"
# Downloads run one at a time in this process; the queue only buffers their
# result strings so they can be reported in batches of five, with a pause
# between batches.
queue = multiprocessing.Queue(maxsize=5)
# Count buffered results ourselves: multiprocessing.Queue.full()/empty() are
# documented as unreliable, so they are not used for control flow.
pending = 0
while True:
    if pending < 5:
        if not urls:
            print("All urls are downloaded!")
            break  # without this, urls.pop() raises IndexError on the empty list
        _url = urls.pop()
        print(f"{_url} is added to queue.")
        queue.put(download(_url, download_path))
        pending += 1
    else:
        print("Queue is full, wait for 5 secs.")
        sleep(5)
        while pending:
            result = queue.get()
            print(result)
            pending -= 1

# Report results of the final, possibly partial, batch.
while pending:
    result = queue.get()
    print(result)
    pending -= 1
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment