Python 爬虫:30 秒爬取 1000 张妹子图

目标网站:煎蛋网妹子图

直接贴代码

#coding=gbk
# Browser-like User-Agent header passed to each requests.get call in this script.
headers = {
    'User-Agent': (
        "Mozilla/5.0 (Windows NT 6.3; WOW64) AppleWebKit/537.36 "
        "(KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36"
    ),
}
import requests,re,random,time
# Start of the wall-clock measurement that is printed at the end of the script.
t1 = time.time()
url = 'http://jandan.net/ooxx/'
# Listing-page URLs: base URL + fixed token + page digit (1..5) + 'comments'.
# NOTE(review): the 'comments' suffix is appended without a '#' separator;
# if a '#comments' fragment was intended, confirm against the site's URLs.
pages = [url + 'MjAyMDAzMDctMjI' + str(i) + 'comments' for i in range(1, 6)]
# Image download addresses
def get_pages():
    """Collect image URLs from every listing page in ``pages``.

    Each URL in the module-level ``pages`` list is fetched using the
    module-level ``headers``. Every protocol-relative ``//....jpg`` match
    found in the response text is prefixed with ``http:``.

    Returns:
        list: Absolute image URLs, in page order and then in order of
        appearance within each page. Duplicates are not removed.

    Raises:
        requests.RequestException: If a page request fails or times out.
    """
    # Compile once; the same pattern is applied to every page.
    jpg_pattern = re.compile(r'//.*?\.jpg')
    image_urls = []
    for page_url in pages:
        # A timeout keeps one unresponsive page from hanging the whole run.
        response = requests.get(page_url, headers=headers, timeout=10)
        # Accumulate matches from every page (not just the last one fetched).
        image_urls.extend(
            'http:' + match for match in jpg_pattern.findall(response.text)
        )
    return image_urls
# Download every image found by get_pages().  A single call already visits
# all listing pages, so the pages are not fetched a second time here and the
# download is not repeated once per page.
image_urls = get_pages()
for index, image_url in enumerate(image_urls):
    # A timeout keeps one unresponsive image host from hanging the run.
    response = requests.get(image_url, headers=headers, timeout=10)
    # Sequential file names are unique; random names in 0..999 could collide
    # and silently overwrite images that were already saved.
    with open(str(index) + '.jpg', 'wb') as f:
        f.write(response.content)
# Report the elapsed time since t1 was taken at the start of the script.
t2 = time.time()
print('共用时{}s'.format(str(t2-t1)))

PS:人生苦短,我用 Python。
正则大法也挺好。

猜你喜欢

转载自www.cnblogs.com/d-uan/p/12438690.html