abearxiong/readme.md

## readme.md

      
    Raw
  

              readme.md
            
          
    copy from https://github.com/arry-lee/wereader

  
## weread.py
import os.path
from collections import defaultdict, namedtuple
from itertools import chain
from operator import attrgetter

import requests

requests.packages.urllib3.disable_warnings()

Book = namedtuple("Book", ["bookId", "title", "author", "cover"])

headers = """
Host: i.weread.qq.com
Connection: keep-alive
Upgrade-Insecure-Requests: 1
User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.103 Safari/537.36
Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3
Accept-Encoding: gzip, deflate, br
Accept-Language: zh-CN,zh;q=0.9,en;q=0.8
"""
headers = dict(x.split(": ", 1) for x in headers.splitlines() if x)


def get_bookmarklist(bookId, cookies):
    """获取某本书的笔记返回md文本"""
    url = "https://i.weread.qq.com/book/bookmarklist"
    params = dict(bookId=bookId)
    r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)

    if r.ok:
        data = r.json()
    else:
        raise Exception(r.text)
    chapters = {c["chapterUid"]: c["title"] for c in data["chapters"]}
    contents = defaultdict(list)

    for item in sorted(data["updated"], key=lambda x: x["chapterUid"]):
        chapter = item["chapterUid"]
        text = item["markText"]
        create_time = item["createTime"]
        start = int(item["range"].split("-")[0])
        contents[chapter].append((start, text))

    chapters_map = {title: level for level, title in get_chapters(int(bookId), cookies)}
    res = ""
    for c in sorted(chapters.keys()):
        title = chapters[c]
        res += "#" * chapters_map[title] + " " + title + "\n"
        for start, text in sorted(contents[c], key=lambda e: e[0]):
            res += "> " + text.strip() + "\n\n"
        res += "\n"

    return res


def get_bestbookmarks(bookId, cookies):
    """获取书籍的热门划线,返回文本"""
    url = "https://i.weread.qq.com/book/bestbookmarks"
    params = dict(bookId=bookId)
    r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)
    if r.ok:
        data = r.json()
    else:
        raise Exception(r.text)
    chapters = {c["chapterUid"]: c["title"] for c in data["chapters"]}
    contents = defaultdict(list)
    for item in data["items"]:
        chapter = item["chapterUid"]
        text = item["markText"]
        contents[chapter].append(text)

    chapters_map = {title: level for level, title in get_chapters(int(bookId), cookies)}
    res = ""
    for c in chapters:
        title = chapters[c]
        res += "#" * chapters_map[title] + " " + title + "\n"
        for text in contents[c]:
            res += "> " + text.strip() + "\n\n"
        res += "\n"
    return res


def get_chapters(bookId, cookies):
    """获取书的目录"""
    url = "https://i.weread.qq.com/book/chapterInfos"
    data = '{"bookIds":["%d"],"synckeys":[0]}' % bookId

    r = requests.post(url, data=data, headers=headers, cookies=cookies, verify=False)

    if r.ok:
        data = r.json()
        # clipboard.copy(json.dumps(data, indent=4, sort_keys=True))
    else:
        raise Exception(r.text)

    chapters = []
    for item in data["data"][0]["updated"]:
        if "anchors" in item:
            chapters.append((item.get("level", 1), item["title"]))
            for ac in item["anchors"]:
                chapters.append((ac["level"], ac["title"]))

        elif "level" in item:
            chapters.append((item.get("level", 1), item["title"]))

        else:
            chapters.append((1, item["title"]))

    return chapters


def get_bookinfo(bookId, cookies):
    """获取书的详情"""
    url = "https://i.weread.qq.com/book/info"
    params = dict(bookId=bookId)
    r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)

    if r.ok:
        data = r.json()
    else:
        raise Exception(r.text)
    return data


def get_bookshelf(cookies):
    """获取书架上所有书"""
    url = "https://i.weread.qq.com/shelf/friendCommon"
    userVid = cookies.get("wr_vid")
    params = dict(userVid=userVid)
    r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)
    if r.ok:
        data = r.json()
    else:
        raise Exception(r.text)
    books = set()
    for book in chain(data["finishReadBooks"], data["recentBooks"]):
        if not book["bookId"].isdigit():  # 过滤公众号
            continue
        try:
            b = Book(book["bookId"], book["title"], book["author"], book["cover"])
            books.add(b)
        except Exception as e:
            pass

    books = list(books)
    books.sort(key=attrgetter("title"))

    return books


def get_notebooklist(cookies):
    """获取笔记本列表"""
    url = "https://i.weread.qq.com/user/notebooks"
    r = requests.get(url, headers=headers, cookies=cookies, verify=False)

    if r.ok:
        data = r.json()
    else:
        raise Exception(r.text)
    books = []
    for b in data["books"]:
        book = b["book"]
        b = Book(book["bookId"], book["title"], book["author"], book["cover"])
        books.append(b)
    books.sort(key=attrgetter("title"))
    return books


def get_bookcover(book,output_dir=None):
    headers = {
        'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9',
        'accept-encoding': 'gzip, deflate, br',
        'accept-language': 'zh-CN,zh;q=0.9',
        'cache-control': 'max-age=0',
        'if-modified-since': 'Thu, 01 Nov 2018 11:45:36 GMT',
        'if-none-match': 'd52c44c46328acfc2e0bd6f4b444f9f03e2a5be2',
        'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="96", "Google Chrome";v="96"',
        'sec-ch-ua-mobile': '?0',
        'sec-ch-ua-platform': '"Windows"',
        'sec-fetch-dest': 'document',
        'sec-fetch-mode': 'navigate',
        'sec-fetch-site': 'none',
        'sec-fetch-user': '?1',
        'upgrade-insecure-requests': '1',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36'
    }

    url = 'b'.join(book.cover.rsplit('s',1))
    r = requests.get(url, headers=headers, verify=False)
    print(r)
    if r.ok:
        data = r.content
    else:
        raise Exception(r.text)

    if output_dir is None:
        output_dir = os.path.abspath(os.path.dirname(__file__))

    path = os.path.join(output_dir, str(book.bookId) + '.jpg')
    print(path)
    with open(path,'wb') as f:
        f.write(data)

if __name__ == '__main__':
    b = Book(622114,'','',"https://wfqqreader-1252317822.image.myqcloud.com/cover/114/622114/s_622114.jpg")
    get_bookcover(b)
	import os.path
	from collections import defaultdict, namedtuple
	from itertools import chain
	from operator import attrgetter

	import requests

	requests.packages.urllib3.disable_warnings()

	Book = namedtuple("Book", ["bookId", "title", "author", "cover"])

	headers = """
	Host: i.weread.qq.com
	Connection: keep-alive
	Upgrade-Insecure-Requests: 1
	User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.103 Safari/537.36
	Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,/;q=0.8,application/signed-exchange;v=b3
	Accept-Encoding: gzip, deflate, br
	Accept-Language: zh-CN,zh;q=0.9,en;q=0.8
	"""
	headers = dict(x.split(": ", 1) for x in headers.splitlines() if x)


	def get_bookmarklist(bookId, cookies):
	"""获取某本书的笔记返回md文本"""
	url = "https://i.weread.qq.com/book/bookmarklist"
	params = dict(bookId=bookId)
	r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)

	if r.ok:
	data = r.json()
	else:
	raise Exception(r.text)
	chapters = {c["chapterUid"]: c["title"] for c in data["chapters"]}
	contents = defaultdict(list)

	for item in sorted(data["updated"], key=lambda x: x["chapterUid"]):
	chapter = item["chapterUid"]
	text = item["markText"]
	create_time = item["createTime"]
	start = int(item["range"].split("-")[0])
	contents[chapter].append((start, text))

	chapters_map = {title: level for level, title in get_chapters(int(bookId), cookies)}
	res = ""
	for c in sorted(chapters.keys()):
	title = chapters[c]
	res += "#" * chapters_map[title] + " " + title + "\n"
	for start, text in sorted(contents[c], key=lambda e: e[0]):
	res += "> " + text.strip() + "\n\n"
	res += "\n"

	return res


	def get_bestbookmarks(bookId, cookies):
	"""获取书籍的热门划线,返回文本"""
	url = "https://i.weread.qq.com/book/bestbookmarks"
	params = dict(bookId=bookId)
	r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)
	if r.ok:
	data = r.json()
	else:
	raise Exception(r.text)
	chapters = {c["chapterUid"]: c["title"] for c in data["chapters"]}
	contents = defaultdict(list)
	for item in data["items"]:
	chapter = item["chapterUid"]
	text = item["markText"]
	contents[chapter].append(text)

	chapters_map = {title: level for level, title in get_chapters(int(bookId), cookies)}
	res = ""
	for c in chapters:
	title = chapters[c]
	res += "#" * chapters_map[title] + " " + title + "\n"
	for text in contents[c]:
	res += "> " + text.strip() + "\n\n"
	res += "\n"
	return res


	def get_chapters(bookId, cookies):
	"""获取书的目录"""
	url = "https://i.weread.qq.com/book/chapterInfos"
	data = '{"bookIds":["%d"],"synckeys":[0]}' % bookId

	r = requests.post(url, data=data, headers=headers, cookies=cookies, verify=False)

	if r.ok:
	data = r.json()
	# clipboard.copy(json.dumps(data, indent=4, sort_keys=True))
	else:
	raise Exception(r.text)

	chapters = []
	for item in data["data"][0]["updated"]:
	if "anchors" in item:
	chapters.append((item.get("level", 1), item["title"]))
	for ac in item["anchors"]:
	chapters.append((ac["level"], ac["title"]))

	elif "level" in item:
	chapters.append((item.get("level", 1), item["title"]))

	else:
	chapters.append((1, item["title"]))

	return chapters


	def get_bookinfo(bookId, cookies):
	"""获取书的详情"""
	url = "https://i.weread.qq.com/book/info"
	params = dict(bookId=bookId)
	r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)

	if r.ok:
	data = r.json()
	else:
	raise Exception(r.text)
	return data


	def get_bookshelf(cookies):
	"""获取书架上所有书"""
	url = "https://i.weread.qq.com/shelf/friendCommon"
	userVid = cookies.get("wr_vid")
	params = dict(userVid=userVid)
	r = requests.get(url, params=params, headers=headers, cookies=cookies, verify=False)
	if r.ok:
	data = r.json()
	else:
	raise Exception(r.text)
	books = set()
	for book in chain(data["finishReadBooks"], data["recentBooks"]):
	if not book["bookId"].isdigit(): # 过滤公众号
	continue
	try:
	b = Book(book["bookId"], book["title"], book["author"], book["cover"])
	books.add(b)
	except Exception as e:
	pass

	books = list(books)
	books.sort(key=attrgetter("title"))

	return books


	def get_notebooklist(cookies):
	"""获取笔记本列表"""
	url = "https://i.weread.qq.com/user/notebooks"
	r = requests.get(url, headers=headers, cookies=cookies, verify=False)

	if r.ok:
	data = r.json()
	else:
	raise Exception(r.text)
	books = []
	for b in data["books"]:
	book = b["book"]
	b = Book(book["bookId"], book["title"], book["author"], book["cover"])
	books.append(b)
	books.sort(key=attrgetter("title"))
	return books


	def get_bookcover(book,output_dir=None):
	headers = {
	'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,/;q=0.8,application/signed-exchange;v=b3;q=0.9',
	'accept-encoding': 'gzip, deflate, br',
	'accept-language': 'zh-CN,zh;q=0.9',
	'cache-control': 'max-age=0',
	'if-modified-since': 'Thu, 01 Nov 2018 11:45:36 GMT',
	'if-none-match': 'd52c44c46328acfc2e0bd6f4b444f9f03e2a5be2',
	'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="96", "Google Chrome";v="96"',
	'sec-ch-ua-mobile': '?0',
	'sec-ch-ua-platform': '"Windows"',
	'sec-fetch-dest': 'document',
	'sec-fetch-mode': 'navigate',
	'sec-fetch-site': 'none',
	'sec-fetch-user': '?1',
	'upgrade-insecure-requests': '1',
	'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36'
	}

	url = 'b'.join(book.cover.rsplit('s',1))
	r = requests.get(url, headers=headers, verify=False)
	print(r)
	if r.ok:
	data = r.content
	else:
	raise Exception(r.text)

	if output_dir is None:
	output_dir = os.path.abspath(os.path.dirname(__file__))

	path = os.path.join(output_dir, str(book.bookId) + '.jpg')
	print(path)
	with open(path,'wb') as f:
	f.write(data)

	if __name__ == '__main__':
	b = Book(622114,'','',"https://wfqqreader-1252317822.image.myqcloud.com/cover/114/622114/s_622114.jpg")
	get_bookcover(b)