Python 编写豆瓣爬虫：Top 100 电影榜单
"""Print the top-100 chart of a Douban movie category as rank / title / rating."""

import json
import re  # no longer used for parsing; kept in case code outside this view needs it
import urllib.request

# Browser-like User-Agent sent with the request.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/87.0.4280.141 Safari/537.36"
}

# Chart endpoint; the query string asks for 100 entries starting at offset 0.
url = "https://movie.douban.com/j/chart/top_list?type=11&interval_id=100%3A90&action=&start=0&limit=100"


def fetch_chart(chart_url=url, request_headers=headers, timeout=10):
    """Download the chart and return the response body as text.

    Args:
        chart_url: Address to request.
        request_headers: HTTP headers sent with the request.
        timeout: Seconds to wait before giving up on the server.

    Returns:
        The response body decoded as UTF-8.

    Raises:
        urllib.error.URLError: If the request fails or times out.
    """
    req = urllib.request.Request(chart_url, headers=request_headers)
    # The context manager closes the connection even if reading fails.
    with urllib.request.urlopen(req, timeout=timeout) as resp:
        return resp.read().decode("utf-8")


def parse_movies(payload):
    """Extract ``(title, rating)`` pairs from the chart's JSON text.

    The title and rating of each movie are read from the same JSON object,
    so they can never be paired with a neighbouring entry, and JSON string
    escapes (``\\"``, ``\\uXXXX``) are decoded properly.

    Args:
        payload: JSON text. Assumed to be an array of objects, each with a
            ``"title"`` string and a ``"rating"`` array whose first item is
            the score -- TODO confirm against the live endpoint.

    Returns:
        A list of ``(title, rating)`` tuples in response order. Entries
        lacking a usable title or rating are skipped.

    Raises:
        ValueError: If ``payload`` is not valid JSON or is not a JSON array.
    """
    entries = json.loads(payload)
    if not isinstance(entries, list):
        raise ValueError("expected a JSON array of movie entries")

    movies = []
    for entry in entries:
        if not isinstance(entry, dict):
            continue
        title = entry.get("title")
        rating = entry.get("rating")
        if isinstance(title, str) and isinstance(rating, list) and rating:
            movies.append((title, rating[0]))
    return movies


def main():
    """Fetch the chart and print one line per movie."""
    for rank, (title, rating) in enumerate(parse_movies(fetch_chart()), start=1):
        print("排名:", rank, "电影名:", title, "豆瓣评分:", rating)


if __name__ == "__main__":
    main()
<< 上一篇