'''
参考文档:http://docs.python-requests.org/zh_CN/latest/user/quickstart.html requests
https://www.crummy.com/software/BeautifulSoup/bs4/doc/index.zh.html bs4
'''
# -*- coding: UTF-8 -*-
from bs4 import BeautifulSoup
import requests
# Scrape the table rows of one announcement page into comma-joined strings.
#
# Module-level names produced by this script:
#   url     -- address of the page that is fetched
#   html    -- decoded text of the page
#   content -- first <tbody> tag found in the parsed page
#   res     -- one string per <tr>: its <td> texts joined with ','
url = 'http://www.hnxcdb.com/readgg.asp?id=1623'

# A timeout keeps the script from hanging forever on an unresponsive server.
response = requests.get(url, timeout=10)
# Fail loudly on an HTTP error instead of parsing the error page as data.
response.raise_for_status()
# Decode the body as GB2312 (original author's note: check the page encoding).
response.encoding = 'gb2312'
html = response.text

# Locate the <tbody> tag; html.parser does not insert one if the page has none.
content = BeautifulSoup(html, 'html.parser').tbody
if content is None:
    raise ValueError('no <tbody> element found in ' + url)

res = []
for row in content.find_all('tr'):
    # Cells whose .string is None are skipped rather than stringified.
    cells = [
        cell.string.strip()
        for cell in row.find_all('td')
        if cell.string is not None
    ]
    print(cells)
    res.append(','.join(cells))
# 利用 Python bs4 爬取企业逾期数据
# 猜你喜欢
# 转载自 blog.csdn.net/huangqihao723/article/details/81712863
# 今日推荐
# 周排行