爬取豆瓣top250
爬取豆瓣 Top250 的电影名称、评分和评价人数。
import requests
from bs4 import BeautifulSoup


def func(ur):
    """Fetch one Douban Top 250 list page and print one line per movie.

    For every ``<li>`` inside the ``<ol class="grid_view">`` element, prints
    the first title span, the rating span, and the text of the last span
    inside the ``star`` div (the rating-count label), separated by spaces.

    Args:
        ur: URL of the list page to download.

    Raises:
        requests.RequestException: on a network failure, a timeout, or a
            non-2xx HTTP status.
    """
    resp = requests.get(
        ur,  # use the parameter; the original read a module-level ``url`` by accident
        headers={
            "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/78.0.3904.108 Safari/537.36"
        },
        # Without a timeout requests waits indefinitely on a stalled connection.
        timeout=10,
    )
    # Fail with a clear HTTP error instead of an AttributeError further down
    # when the server refuses the request and the list element is absent.
    resp.raise_for_status()

    main_page = BeautifulSoup(resp.text, "html.parser")
    ol = main_page.find("ol", attrs={"class": "grid_view"})
    lst = ol.find_all("li")
    for li in lst:
        name = li.find("div", attrs={"class": "hd"}).find("span", attrs={"class": "title"}).text
        score = li.find("span", attrs={"class": "rating_num"}).text
        # The last <span> in the star block holds the rating-count text.
        evaluate = li.find("div", attrs={"class": "star"}).find_all("span")[-1].text
        print(name, score, evaluate)


# Request ten pages with start offsets 0, 25, ..., 225.
for i in range(10):
    url = f"https://movie.douban.com/top250?start={i*25}&filter="
    func(url)
运行后打印截图: