千峰-python-爬取帅哥图片

老师讲解:

from urllib import request
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

# Download the first picture embedded in one article page and save it locally.

# 1. Address of the article page that embeds the picture.
url = "http://www.shuaia.net/mingxing/2018-06-08/14986.html"
# 2. Local file name for the download; remember to keep the extension.
img_name = "陈.jpg"

# 3. Fetch the page. The timeout keeps the script from hanging forever if the
#    server never answers.
img_req = requests.get(url=url, timeout=10)
# 4. Print the HTTP status code (200 means the page opened successfully), then
#    stop on 4xx/5xx instead of parsing an error page.
print("响应码", img_req.status_code)
img_req.raise_for_status()
# 5. Decode the response body as UTF-8.
img_req.encoding = "utf-8"
# 6. Extract the page text and print it for inspection.
img_text = img_req.text
print(img_text)

# 7. Parse the HTML.
bf = BeautifulSoup(img_text, 'lxml')
# 8. Locate the first div that wraps the picture, then the first <img> inside
#    it. Searching the parsed tree directly avoids stringifying the result
#    list and parsing it a second time.
content_div = bf.find('div', class_="wr-single-content-list")
img_tag = content_div.find('img') if content_div is not None else None
# 9. Read the picture path from the tag's src attribute.
url_end = img_tag.get('src') if img_tag is not None else None
if not url_end:
    # Fail with a clear message rather than an AttributeError/TypeError below.
    raise RuntimeError("no <img src> found in div.wr-single-content-list on " + url)

# 10. Resolve the picture path against the page URL. Unlike plain string
#     concatenation with the host, this also handles a src that is already
#     absolute or that is relative without a leading slash.
imgUrl = urljoin(url, url_end)
# 11. Download the picture; urlretrieve needs the full URL and the file name.
request.urlretrieve(url=imgUrl, filename=img_name)
# 12. Report success.
print("下载图片成功")

运行结果:
这里写图片描述
我的制作:

from urllib import request
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

# Download the first picture embedded in one article page and save it locally.

# Article page that embeds the picture, and the local file name to save it as.
url = "http://www.shuaia.net/shuaige/2018-05-23/14975.html"
image_name = "帅哥.jpg"

# Fetch the page. The timeout keeps the script from hanging forever if the
# server never answers.
img_req = requests.get(url=url, timeout=10)
# Print the HTTP status code, then stop on 4xx/5xx instead of parsing an
# error page.
print("响应码", img_req.status_code)
img_req.raise_for_status()
# Decode the response body as UTF-8 and print the page text for inspection.
img_req.encoding = "utf-8"
img_text = img_req.text
print(img_text)

# Parse the HTML and locate the first div that wraps the picture, then the
# first <img> inside it. Searching the parsed tree directly avoids
# stringifying the result list and parsing it a second time.
bf1 = BeautifulSoup(img_text, "lxml")
content_div = bf1.find("div", class_="wr-single-content-list")
img_tag = content_div.find("img") if content_div is not None else None
url_end = img_tag.get("src") if img_tag is not None else None
if not url_end:
    # Fail with a clear message rather than an AttributeError/TypeError below.
    raise RuntimeError("no <img src> found in div.wr-single-content-list on " + url)

# Resolve the picture path against the page URL. Unlike plain string
# concatenation with the host, this also handles a src that is already
# absolute or that is relative without a leading slash.
imgUrl = urljoin(url, url_end)
# Download the picture to the local file and report success.
request.urlretrieve(url=imgUrl, filename=image_name)
print("成功")

这里写图片描述
帅哥我还是更喜欢陈晓0.0

猜你喜欢

转载自blog.csdn.net/lijia111111/article/details/80642587