1234567891011121314151617181920212223242526 |
- import requests
- import re
def get_article_links():
    """Return the page URLs listed in the remote article data file.

    Downloads the JavaScript data file, extracts the array located between
    ``list":`` and ``,"count":``, keeps at most its first 20000 entries and
    returns each kept entry's ``static_page_url`` in reverse array order.

    Returns:
        list: The ``static_page_url`` values, last kept entry first.

    Raises:
        ValueError: If the expected list is not found in the payload, or if
            it is not valid JSON (``json.JSONDecodeError`` is a subclass).
        KeyError: If an entry has no ``static_page_url`` key.
    """
    # Imported locally so this function is self-contained.
    import json

    payload = requests.get(
        "https://www.xuexi.cn/c06bf4acc7eef6ef0a560328938b5771/data9a3668c13f6e303932b5e0e100fc248b.js"
    ).content.decode("utf8")

    match = re.search(r"list\"\:(.+),\"count\"\:", payload)
    if match is None:
        raise ValueError("article list not found in the downloaded data file")

    # The payload comes from the network, so it must never be passed to
    # eval(): that would execute arbitrary code, and it also breaks on the
    # JSON literals true/false/null. The array is presumably plain JSON
    # (NOTE(review): confirm against a live response).
    entries = json.loads(match.group(1))[:20000]

    return [entry["static_page_url"] for entry in reversed(entries)]
def get_video_links():
    """Return the ``.html`` page URLs found in the remote video data file.

    Downloads the JavaScript data file, decodes it as UTF-8 and collects
    every substring matching the URL pattern (case-insensitive).

    Returns:
        list: The matched URLs, in reverse order of appearance in the file.
    """
    data_url = "https://www.xuexi.cn/4426aa87b0b64ac671c96379a3a8bd26/datadb086044562a57b441c24f2af1c8e101.js"
    response = requests.get(data_url)
    text = response.content.decode("utf8")

    # A URL ends at the first "html" that follows without an intervening
    # comma or double quote.
    url_pattern = r'https://www.xuexi.cn/[^,"]*html'
    found = re.findall(url_pattern, text, re.I)

    # Last match in the file comes first in the result.
    return found[::-1]
|