Last active
August 16, 2024 20:05
-
-
Save SeungjunNah/b10d369b92840cb8dd2118dd4f41d643 to your computer and use it in GitHub Desktop.
REDS dataset downloading script
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# reference: https://stackoverflow.com/questions/25010369/wget-curl-large-file-from-google-drive
import os | |
import requests | |
import argparse | |
def download_file_from_google_drive(id, destination):
    """Download a Google Drive file by its file ID and write it to disk.

    A first request is sent with only the file ID. If that response carries a
    cookie whose name starts with ``download_warning``, the cookie value is
    sent back as the ``confirm`` parameter in a second request, and the body
    of that second response is what gets saved.

    Args:
        id: Google Drive file ID. The parameter name shadows the builtin but
            is kept so existing keyword callers keep working.
        destination: Path of the local file to write (opened in binary mode).

    Raises:
        requests.HTTPError: If the final response has a 4xx/5xx status.
    """
    def get_confirm_token(response):
        """Return the value of the first ``download_warning*`` cookie, or None."""
        for key, value in response.cookies.items():
            if key.startswith('download_warning'):
                return value
        return None

    def save_response_content(response, destination):
        """Stream the response body into ``destination`` chunk by chunk."""
        CHUNK_SIZE = 32768
        with open(destination, "wb") as f:
            for chunk in response.iter_content(CHUNK_SIZE):
                if chunk:  # filter out keep-alive new chunks
                    f.write(chunk)

    URL = "https://docs.google.com/uc?export=download"

    # The session is used as a context manager so its connections are
    # released even when a request or the file write fails.
    with requests.Session() as session:
        response = session.get(URL, params={'id': id}, stream=True)
        try:
            token = get_confirm_token(response)
            if token:
                # The first (streamed) response is not needed any more;
                # release its connection before issuing the confirmed request.
                response.close()
                params = {'id': id, 'confirm': token}
                response = session.get(URL, params=params, stream=True)

            # Fail before opening the destination so that an error page is
            # never written to disk in place of the requested file.
            response.raise_for_status()
            save_response_content(response, destination)
        finally:
            response.close()
def download_file_from_server(server, subset, destination):
    """Download one REDS subset archive from the selected server.

    Args:
        server: ``'google'`` to fetch from Google Drive (the file ID is looked
            up in the module-level ``ids`` mapping) or ``'snu'`` to fetch
            ``<subset>.zip`` from the SNU WebDAV URL.
        subset: Name of the subset, e.g. ``'train_sharp'``.
        destination: Path of the local file to write (opened in binary mode).

    Raises:
        ValueError: If ``server`` is neither ``'google'`` nor ``'snu'``.
        KeyError: If ``server`` is ``'google'`` and ``subset`` is not in ``ids``.
        requests.HTTPError: If the final response has a 4xx/5xx status.
        RuntimeError: If the server answers with an HTML page instead of the
            archive (for example a confirmation or quota page).
    """
    def get_confirm_token(response):
        """Return the value of the first ``download_warning*`` cookie, or None."""
        for key, value in response.cookies.items():
            if key.startswith('download_warning'):
                return value
        return None

    def save_response_content(response, destination):
        """Stream the response body into ``destination`` chunk by chunk."""
        CHUNK_SIZE = 32768
        with open(destination, "wb") as f:
            for chunk in response.iter_content(CHUNK_SIZE):
                if chunk:  # filter out keep-alive new chunks
                    f.write(chunk)

    # Resolve the request target first so that an unsupported server is
    # rejected with a clear error before any network or file activity.
    if server == 'google':
        URL = "https://docs.google.com/uc?export=download"
        params = {'id': ids[subset]}
    elif server == 'snu':
        URL = 'http://data.cv.snu.ac.kr:8008/webdav/dataset/REDS/' + subset + '.zip'
        params = {}
    else:
        raise ValueError(
            "unknown server {!r}; expected 'google' or 'snu'".format(server)
        )

    # The session is used as a context manager so its connections are
    # released even when a request or the file write fails.
    with requests.Session() as session:
        response = session.get(URL, params=params, stream=True)
        try:
            token = get_confirm_token(response)
            if token:
                # Release the first streamed response before re-requesting
                # with the confirmation token attached.
                response.close()
                params['confirm'] = token
                response = session.get(URL, params=params, stream=True)

            # Fail before opening the destination so that an error body is
            # never written to disk in place of the archive.
            response.raise_for_status()

            # Every subset is a .zip archive, so an HTML body means the server
            # sent a web page (e.g. a confirmation page) rather than the file.
            content_type = response.headers.get('Content-Type', '')
            if content_type.lower().startswith('text/html'):
                raise RuntimeError(
                    'Expected {}.zip but the server returned an HTML page; '
                    'nothing was saved. Try again later or use another '
                    'server.'.format(subset)
                )

            save_response_content(response, destination)
        finally:
            response.close()
# Command-line interface: a server selector, an --all switch, and one
# on/off switch per downloadable subset archive.
parser = argparse.ArgumentParser(
    description='Download REDS dataset from google drive to current folder',
    allow_abbrev=False,
)
parser.add_argument(
    '--server',
    type=str,
    default='snu',
    choices=('google', 'snu'),
    help='download server choice.',
)
parser.add_argument('--all', action='store_true', help='download full REDS dataset')

# Each subset gets a boolean flag named after it; the order here is the
# order in which the flags are registered and listed in --help.
for _subset_name in (
    'train_sharp',
    'train_blur',
    'train_blur_comp',
    'train_sharp_bicubic',
    'train_blur_bicubic',
    'val_sharp',
    'val_blur',
    'val_blur_comp',
    'val_sharp_bicubic',
    'val_blur_bicubic',
    'test_blur',
    'test_blur_comp',
    'test_sharp_bicubic',
    'test_blur_bicubic',
):
    parser.add_argument(
        '--' + _subset_name,
        action='store_true',
        help='download ' + _subset_name + '.zip',
    )

args = parser.parse_args()
# Maps each subset name to the file ID used when that subset is requested
# from the 'google' server. Insertion order is the download order.
ids = dict(
    train_sharp='1YLksKtMhd2mWyVSkvhDaDLWSc1qYNCz-',
    train_blur='1Be2cgzuuXibcqAuJekDgvHq4MLYkCgR8',
    train_blur_comp='1hi6348BB9QQFqVx2PY7pKn32HQM89CJ1',
    train_sharp_bicubic='1a4PrjqT-hShvY9IyJm3sPF0ZaXyrCozR',
    train_blur_bicubic='10u8gthv2Q95RMCb1LeCN8N4ozB8TVjMt',
    val_sharp='1MGeObVQ1-Z29f-myDP7-8c3u0_xECKXq',
    val_blur='1N8z2yD0GDWmh6U4d4EADERtcUgDzGrHx',
    val_blur_comp='13d1uzqLdbsQzeZkWgdF5QVHqDSjfE4zZ',
    val_sharp_bicubic='1sChhtzN9Css10gX7Xsmc2JaC-2Pzco6a',
    val_blur_bicubic='1i3NAb7EmF4fCYadGaHK54-Zgx9lIC2Gp',
    test_blur='1dr0--ZBKqr4P1M8lek6JKD1Vd6bhhrZT',
    test_blur_comp='1OctyKR3ER_YWrZxKxQsZzLis3BvLSOFO',
    test_sharp_bicubic='1y0Jle6xB41TdRK_QMJ_E8W_iBMxwq_Rh',
    test_blur_bicubic='14YszfzUAeAfwP0ZA2FRzAiVxxZLg7-tY',
)
# Download files in REDS directory: reuse the current directory when it is
# already named 'REDS', otherwise create (if needed) and use a 'REDS' subfolder.
if os.path.basename(os.getcwd()) != 'REDS':
    os.makedirs('REDS', exist_ok=True)
    root_dir = 'REDS'
else:
    root_dir = '.'

# Neither of these depends on the subset, so compute them once up front.
servername = 'Google Drive' if args.server == 'google' else 'SNU CVLab'
argdict = vars(args)

for subset in ids:
    # Skip subsets that were not requested, unless --all was given.
    if not (args.all or argdict[subset]):
        continue

    filename = '{}/{}.zip'.format(root_dir, subset)
    print('Downloading {}.zip from {}'.format(subset, servername))
    # Fetch the designated subset into the chosen directory.
    download_file_from_server(args.server, subset, filename)
@wangruohui The file size warning message is normal and you are good to proceed.
The download script failure is unlikely to be related to that. The download script may fail due to the traffic limit that Google Drive imposes when there are many download requests. Please try again later, and if you have further issues, please send me an email.
Hi @SeungjunNah, is it possible to release test_sharp.zip now that the challenge has been over for 5 years?
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Hello,
It seems that downloading directly from the Google server results in a web page instead of the file itself; the page warns that the file is too large for Google to scan for viruses. If I download manually from the browser, a further confirmation is required to download the zip file itself, but this script does not handle that confirmation step.
As shown below, this script actually downloads this webpage.