爬虫 -- 必应壁纸

import requests
import urllib.request
import uuid
from bs4 import BeautifulSoup
import os

# Download the wallpaper images listed on pages 1-49 of bing.ioliu.cn and
# store them as sequentially numbered .jpg files in `save_dir`.

# Single source of truth for the output directory: the existence check, the
# directory creation and the download target must all refer to the same path.
save_dir = '/home/dell/Pictures'

if os.path.isdir(save_dir):
    print("image dir is exsit")
else:
    # Create the directory that the files are actually written to (including
    # any missing parents) so that urlretrieve below does not fail.
    os.makedirs(save_dir, exist_ok=True)

i = 0  # number of images downloaded so far; also used as the file name
for page in range(1, 50):
    url = 'https://bing.ioliu.cn/?p=' + str(page)
    # A timeout keeps one stalled connection from hanging the whole run.
    r = requests.get(url, timeout=30)
    contents = r.text

    soup = BeautifulSoup(contents, 'html.parser')
    # Each wallpaper entry is looked up as a <div class="item">.
    divs = soup.find_all('div', 'item')

    for div in divs:
        for img in div.find_all('img'):
            src = img.get('src')
            if not src:
                # An <img> without a src has nothing to download.
                continue
            print(src)
            urllib.request.urlretrieve(src, os.path.join(save_dir, '%s.jpg' % i))
            i += 1
            print('成功抓取第%s张图片' % i)
print('共抓取' + str(i) + '张图片')

发布了88 篇原创文章 · 获赞 5 · 访问量 7964

猜你喜欢

转载自blog.csdn.net/bornfree5511/article/details/103931806