# Python 豆瓣爬虫 (Python Douban crawler)

'''
Python 豆瓣爬虫 by 郑瑞国
'''
import re
import urllib.request 

def open_url(url):
    """Fetch *url* and return the response body as text.

    The body is decoded as UTF-8; byte sequences that are not valid UTF-8
    are dropped (``errors="ignore"``) instead of raising.

    Args:
        url: URL string (or ``urllib.request.Request``) to open.

    Returns:
        The decoded response body as ``str``.

    Raises:
        urllib.error.URLError: propagated from ``urlopen`` when the
            resource cannot be opened.
    """
    # Use the response as a context manager so the underlying connection is
    # closed deterministically rather than whenever it is garbage-collected.
    with urllib.request.urlopen(url) as response:
        return response.read().decode("utf-8", "ignore")

def find_text(url):
    """Return the contents of every ``<div class="name">`` element at *url*.

    The page is downloaded with ``open_url`` and scanned with a non-greedy
    regular expression; because no regex flags are set, a match cannot span
    a line break.

    Args:
        url: Address of the page to scan.

    Returns:
        A list of the captured strings, in document order (empty when
        nothing matches).
    """
    page = open_url(url)
    name_pattern = re.compile('<div class="name">(.*?)</div>')
    return name_pattern.findall(page)

def save_text(text, path=r'd:\test.txt'):
    """Append each string in *text* to a file, one per line.

    Args:
        text: Iterable of strings to write. Every item is followed by a
            newline. An empty iterable leaves the file content unchanged
            (the file is still created if it does not exist).
        path: Destination file. Defaults to the location the script has
            always written to.

    Raises:
        OSError: if the file cannot be opened for appending.
        TypeError: if an item of *text* is not a string.
    """
    # An explicit encoding keeps the output independent of the platform's
    # default codec, which may be unable to represent the scraped names.
    with open(path, 'a', encoding='utf-8') as f:
        f.writelines(line + "\n" for line in text)

if __name__ == "__main__":
    # Script entry point: scrape the provider listing page and append every
    # extracted name to the output file.
    save_text(find_text('https://read.douban.com/provider/all'))

# 猜你喜欢 (You may also like)

# 转载自 (reposted from) blog.csdn.net/zheng_ruiguo/article/details/85066414