'''
Python 豆瓣爬虫 by 郑瑞国
'''
import re
import urllib.request
def open_url(url):
    """Fetch *url* and return the response body decoded as UTF-8 text.

    Bytes that are not valid UTF-8 are silently dropped instead of raising.

    Args:
        url: URL string (or ``urllib.request.Request``) to open.

    Returns:
        The decoded response body as ``str``.

    Raises:
        urllib.error.URLError: If the request cannot be completed.
    """
    # The context manager closes the response (and its underlying socket)
    # even if reading fails, rather than leaving cleanup to the GC.
    with urllib.request.urlopen(url) as response:
        return response.read().decode("utf-8", "ignore")
def find_text(url):
    """Return the contents of every ``<div class="name">`` element at *url*.

    The page is downloaded with ``open_url`` and scanned with a non-greedy
    regular expression; because ``.`` does not match newlines here, only
    elements whose content sits on a single line are captured.

    Args:
        url: Address of the page to scan.

    Returns:
        A list of the captured strings, in document order.
    """
    page_source = open_url(url)
    name_pattern = re.compile('<div class="name">(.*?)</div>')
    return name_pattern.findall(page_source)
def save_text(text, path=r'd:\test.txt'):
    """Append each string in *text* to a file, one entry per line.

    Args:
        text: Iterable of strings to write.
        path: Destination file; defaults to the original hard-coded
            location. The file is created if it does not exist.

    Raises:
        OSError: If the file cannot be opened or written.
    """
    # An explicit UTF-8 encoding keeps non-ASCII entries (e.g. Chinese
    # names) from failing or being mangled under a locale-dependent
    # default codepage.
    with open(path, 'a', encoding='utf-8') as f:
        f.writelines(line + "\n" for line in text)
if __name__ == "__main__":
    # Script entry point: scrape the names from the Douban Read provider
    # listing page and append them to the output file.
    save_text(find_text('https://read.douban.com/provider/all'))
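# Python 豆瓣爬虫 (Python Douban crawler)
# 猜你喜欢 (You may also like)
# 转载自 (Reposted from) blog.csdn.net/zheng_ruiguo/article/details/85066414
# 今日推荐 (Today's recommendations)
# 周排行 (Weekly ranking)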