Skip to content

Instantly share code, notes, and snippets.

@modalsoul
Created November 5, 2018 16:12
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save modalsoul/2b9b7be886d7999f0b36cb9082029e84 to your computer and use it in GitHub Desktop.
Save modalsoul/2b9b7be886d7999f0b36cb9082029e84 to your computer and use it in GitHub Desktop.
import time
from selenium import webdriver
# Page that main() loads; a link on it is clicked to start the download.
URL = 'https://www.post.japanpost.jp/zipcode/dl/oogaki-zip.html'
# Directory handed to Chrome (both via prefs and via the DevTools command)
# as the destination for downloaded files.
DOWNLOAD_PATH = '/opt/app/scraping/dst'
def enable_download_in_headless_chrome(driver, download_dir):
    """Tell a Chrome session to allow downloads into *download_dir*.

    Registers a ``send_command`` entry on the driver's command executor that
    POSTs to chromedriver's ``/chromium/send_command`` endpoint, then uses it
    to issue the DevTools command ``Page.setDownloadBehavior`` with
    ``behavior='allow'``.

    Args:
        driver: WebDriver instance exposing ``command_executor._commands``
            and ``execute`` (a Selenium Chrome driver in this script).
        download_dir: Path sent to Chrome as ``downloadPath``.
    """
    # NOTE(review): presumably needed because headless Chrome does not save
    # downloads unless told to -- confirm for the Chrome version in use.
    # ``_commands`` is a private attribute of the command executor, so this
    # may break across Selenium versions.
    driver.command_executor._commands["send_command"] = (
        "POST",
        '/session/$sessionId/chromium/send_command',
    )
    params = {
        'cmd': 'Page.setDownloadBehavior',
        'params': {'behavior': 'allow', 'downloadPath': download_dir},
    }
    driver.execute("send_command", params)
def main():
    """Load URL in headless Chrome and click a link to trigger a download.

    Starts Chrome with ``--headless`` and ``--no-sandbox``, points its
    download directory at ``DOWNLOAD_PATH``, enables downloads for the
    session, opens ``URL``, clicks the 28th ``<a>`` element on the page via
    JavaScript, waits three seconds, and shuts the browser down.
    """
    options = webdriver.ChromeOptions()
    options.add_argument('--headless')
    options.add_argument('--no-sandbox')
    prefs = {
        "download.default_directory": DOWNLOAD_PATH,
        "download.prompt_for_download": False,
    }
    options.add_experimental_option("prefs", prefs)
    # ``options=`` replaces the deprecated ``chrome_options=`` keyword.
    driver = webdriver.Chrome(options=options)
    try:
        enable_download_in_headless_chrome(driver, DOWNLOAD_PATH)
        driver.get(URL)
        # The target link is addressed purely by position (index 27 among all
        # anchors); this will click a different link if the page layout changes.
        driver.execute_script("document.getElementsByTagName('a')[27].click()")
        # Fixed grace period for the download to finish before the browser
        # is torn down; nothing here verifies that the file is complete.
        time.sleep(3)
    finally:
        # Always end the session, even if a step above raised, so no Chrome
        # process is left behind. quit() also closes the window, so a
        # separate close() call is not needed.
        driver.quit()
# Run the download only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment