import re
import requests
from fake_useragent import UserAgent
# Monthly-ticket ranking page on qidian.com that this script scrapes.
url = 'https://www.qidian.com/rank/yuepiao/'

# Captures the link text of the title anchor inside each "book-mid-info" div.
# The capture group is lazy (`.+?`) so it stops at the FIRST `</a>`; a greedy
# `.+` runs to the LAST `</a>` on the same line and therefore drags all the
# markup that follows the title into the result.
_TITLE_RE = re.compile(r'<div class="book-mid-info"> <h2><a href=".+?>(.+?)</a>')


def extract_titles(html):
    """Return the book titles found in a ranking page's HTML.

    Args:
        html: The page source as a string.

    Returns:
        A list with one string per matched title anchor, in document order.
        The list is empty when nothing matches.
    """
    return _TITLE_RE.findall(html)


def main():
    """Download the ranking page, save it to ``tmp.html`` and print the titles."""
    headers = {'User-Agent': UserAgent().chrome}
    # A timeout keeps the script from hanging forever on a stalled connection.
    res = requests.get(url, headers=headers, timeout=10)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    res.raise_for_status()
    res.encoding = 'utf-8'

    # Keep a copy of the raw page so the pattern can be checked against it.
    with open('tmp.html', 'w', encoding='utf-8') as f:
        f.write(res.text)

    rs = extract_titles(res.text)
    print(rs)


if __name__ == '__main__':
    main()
# 问题:爬取起点网月票榜时,为什么匹配结果里除了想要的书名之外,后面还带着一大串 HTML 标签?
