Skip to content

Instantly share code, notes, and snippets.

View clarissarjtai's full-sized avatar
🎯
Focusing

Clarissa RJ Tai clarissarjtai

🎯
Focusing
View GitHub Profile
@clarissarjtai
clarissarjtai / Selenium Python-2.py
Created October 6, 2020 10:33
Selenium in Python Tutorial-2
from selenium import webdriver
from selenium.webdriver.common.by import By
# Launch Chrome through the browser driver (chromedriver) found at the given path.
# NOTE(review): recent Selenium 4 releases expect the driver path to be supplied
# through a Service object rather than positionally — confirm against the
# installed Selenium version.
driver = webdriver.Chrome(r"C:\Clarissa\文章\程式碼\Selenium\chromedriver")
# Navigate to a specific URL.
default_url = "https://www.google.com.tw"
driver.get(default_url)
# Get the URL of the page currently loaded. The value is neither stored nor
# printed, so it is only displayed when run interactively (REPL / notebook).
driver.current_url
@clarissarjtai
clarissarjtai / Instagram Image&Video.py
Last active September 27, 2023 08:06
Getting all image and video URLs from an Instagram post.
import time
from selenium import webdriver
from bs4 import BeautifulSoup as Soup
from selenium.webdriver.common.by import By
from selenium.webdriver.support.wait import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
# Starts as an empty list; presumably filled with the collected media URLs by
# code outside this excerpt — verify.
media_url = []
count = 0 # Number of image links obtained so far
# Parse the browser's current page source with the lxml parser.
# NOTE(review): `browser` is not defined in the visible excerpt — presumably a
# Selenium WebDriver created elsewhere; confirm.
soup = Soup(browser.page_source,"lxml")
@clarissarjtai
clarissarjtai / Instagram Post Time.py
Last active September 19, 2020 03:02
Getting the post time of an Instagram post.
from selenium import webdriver
from bs4 import BeautifulSoup as Soup
# Open the Instagram post in a Chrome session driven by Selenium.
# NOTE(review): the browser session is left open by this script; call
# browser.quit() once no further pages need to be loaded.
browser = webdriver.Chrome()
url = 'https://www.instagram.com/p/CEYqVrtp1HA/'
browser.get(url)

# Parse the page source as currently rendered by the browser.
soup = Soup(browser.page_source, "lxml")

# Locate the first <article> element. BeautifulSoup yields None when the tag
# is absent, so fail with a clear message instead of an AttributeError on None.
arti = soup.article
if arti is None:
    raise RuntimeError("No <article> element found in the page source of " + url)

# Find the element carrying the timestamp by its class attribute. find()
# returns None when nothing matches (e.g. if the site's class names changed).
time_tag = arti.find(class_="_1o9PC Nzb55")
if time_tag is None:
    raise RuntimeError(
        'No element with class "_1o9PC Nzb55" found inside <article> of ' + url
    )

# Read the element's `datetime` attribute (None if the attribute is missing).
post_time = time_tag.get('datetime')
print(post_time)