import requests
from fake_useragent import UserAgent
from bs4 import BeautifulSoup
def format_actors(a_list):
actor_set = set()
for a in a_list:
actor_set.add(a.text.strip())
return actor_set
def start():
url = 'https://www.maoyan.com/films/1300821'
headers = {
'User-Agent': UserAgent().opera
}
resp = requests.get(url, headers=headers)
soup = BeautifulSoup(resp.text,'lxml')
name = soup.select('h1.name')[0].text
types = soup.select('h1.ellipsis')[0].text
actors_m = soup.select('li.celebrity.actor>div>a')
actors = format_actors(actors_m)
print(f'电影名:{name} 类型:{types} 演员:{actors}')
if __name__ == '__main__':
start()
## 错误类型
name = soup.select('h1.name')[0].text
IndexError: list index out of range
这是怎么一回事 如何解决啊