"""Print the movie titles found on each page of Douban's Top 250 chart.

The script fetches the ten result pages one after another, extracts every
``<span class="title">`` element and prints its text, skipping entries whose
second character is ``/``.
"""

import requests
from bs4 import BeautifulSoup

# Browser-like User-Agent header sent with every request.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/117.0.0.0 Safari/537.36 Edg/117.0.2045.36"
}

# Seconds to wait for the server before giving up; without a timeout a
# stalled connection would block the script forever.
REQUEST_TIMEOUT = 10

# Pages are addressed through the ``start`` query parameter: 0, 25, ..., 225.
for start_num in range(0, 250, 25):
    response = requests.get(
        f"https://movie.douban.com/top250?start={start_num}",
        headers=headers,
        timeout=REQUEST_TIMEOUT,
    )
    # Fail loudly on an HTTP error instead of silently parsing an error page
    # that contains no titles.
    response.raise_for_status()

    soup = BeautifulSoup(response.text, "html.parser")
    for title_span in soup.find_all("span", attrs={"class": "title"}):
        # get_text() always returns a str, whereas .string is None when the
        # span contains nested markup.
        text = title_span.get_text()
        # NOTE(review): presumably alternate-language titles are rendered as
        # "<nbsp>/<nbsp>Title", putting "/" at index 1 -- confirm against the
        # live page markup. Slicing (rather than indexing) avoids an
        # IndexError on texts shorter than two characters.
        if text[1:2] != "/":
            print(text)