# asukaminato0721/douban_crawel.py

## douban_crawel.py
from typing import List

import requests
from lxml.etree import HTML

# Fetch one page of a Douban doulist and print the title of each entry.
#
# The script runs at import time: it performs a single HTTP GET, parses the
# returned HTML and prints every non-empty title, one per line.
#
# NOTE: a tab-indented, whitespace-mangled second copy of this script used to
# follow the print loop. It made the module unparsable and would only have
# repeated the same request, so it has been removed.

# HTTP headers sent with the request (a desktop Firefox User-Agent string).
headers = {
    "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:95.0) Gecko/20100101 Firefox/95.0",
}

# Query-string parameters for the doulist URL.
# "start" is presumably the pagination offset (the inline note lists the
# values used so far) -- confirm against the site before changing the step.
params = (
    ("start", "75"),  # ["0", "25", "50", "75"]
    ("sort", "seq"),
    ("playable", "0"),
    ("sub_type", ""),
)

response = requests.get(
    "https://www.douban.com/doulist/968362/",
    headers=headers,
    params=params,
    # Without a timeout, requests waits indefinitely on a stalled connection.
    timeout=10,
)
# Fail loudly on 4xx/5xx instead of parsing an error page and printing nothing.
response.raise_for_status()

html = HTML(response.text)

# Text nodes of every <a> directly inside <div class="title">.
result: List[str] = html.xpath("//div[@class='title']/a/text()")

for raw_title in result:
    title = raw_title.strip()
    # Whitespace-only text nodes strip down to "" and are skipped.
    if title:
        print(title)