第01步:获取网页信息

from urllib.request import urlopen, Request
from lxml import etree
# Fetch one page of the Douban Top 250 listing and print its raw HTML.
# (The original note describes this step as "fetch the information of page i".)

# URL template for a listing page; %s is the value of the `start` query
# parameter and must be filled in before the request is made.
url = 'https://movie.douban.com/top250?start=%s&filter='
# Browser-like User-Agent header sent with the request.
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36'}

# Substitute the placeholder; without this the literal text "%s" would be
# sent to the server as the `start` value.
# NOTE(review): 0 presumably selects the first page — confirm the per-page
# step against the site before looping over further pages.
start = 0
page_url = url % start

ret = Request(page_url, headers=headers)
# Use a context manager so the HTTP response is closed once the body is read.
with urlopen(ret) as res:
    aa = res.read().decode('utf-8')
print(aa)

https://blog.csdn.net/sinat_37812785/article/details/104247874

猜你喜欢

转载自blog.csdn.net/jidawanghao/article/details/108375845
今日推荐