爬取校花网美眉图

#Author:Elson Zeng
import os
import requests
import re


# http://www.xiaohuar.com/list-1-1.html
# http://www.xiaohuar.com/list-1-2.html

# Sample tag from a listing page (the src attribute is what gets extracted):
# <img width="210" alt="台湾朝阳科技大学校花陈静怡" src="/d/file/20181113/f957a341bd5ff1dd62641494ce6db464.jpg">
# Listing-page URL template; the %s placeholder receives the page index.
urls = 'http://www.xiaohuar.com/list-1-%s.html'
# Directory that receives the downloaded images. The trailing slash matters:
# file names are appended to it by plain string concatenation below.
path = 'C:/Users/JIAN/Desktop/python_dowload/'+ 'MM' + '/'

# Site-relative image paths as they appear in the listing HTML.
# Compiled once instead of being re-specified for every page.
_IMG_PATTERN = re.compile(r'/d/file/\d+/\w+\.jpg')
# Seconds to wait for the server; without a timeout a single stalled
# connection would block the whole crawl forever.
_TIMEOUT = 10

# Create the target directory once, up front. makedirs (unlike mkdir) also
# creates missing parent directories and tolerates an existing directory.
os.makedirs(path, exist_ok=True)

for i in range(1000):
    temp = urls % i
    try:
        response = requests.get(temp, timeout=_TIMEOUT)
    except requests.RequestException as err:
        # One unreachable page should not abort the remaining pages.
        print('skipping page %s: %s' % (temp, err))
        continue
    if response.status_code != 200:
        # Error pages carry no usable image links.
        continue
    html = response.text
    girl_urls = _IMG_PATTERN.findall(html)

    for girl_url in girl_urls:
        # The file name is the last path segment of the image URL.
        girl_name = girl_url.split('/')[-1]
        girl_path = path + girl_name
        # Check the disk BEFORE downloading so that re-runs and duplicate
        # matches on a page do not fetch the same image again.
        if os.path.exists(girl_path):
            continue
        try:
            img_response = requests.get('http://www.xiaohuar.com' + girl_url,
                                        timeout=_TIMEOUT)
        except requests.RequestException as err:
            print('skipping image %s: %s' % (girl_url, err))
            continue
        if img_response.status_code != 200:
            # Do not save an HTML error body under a .jpg name.
            continue
        img_data = img_response.content
        with open(girl_path, 'wb') as f:
            f.write(img_data)

猜你喜欢

转载自www.cnblogs.com/elson-zeng/p/10808121.html
今日推荐