利用 Python 和 bs4 爬取企业逾期数据


'''
参考文档:
requests:http://docs.python-requests.org/zh_CN/latest/user/quickstart.html

bs4(BeautifulSoup):https://www.crummy.com/software/BeautifulSoup/bs4/doc/index.zh.html

'''

# -*- coding: UTF-8 -*-

from bs4 import BeautifulSoup
import  requests

# Fetch one announcement page and flatten every table row into a
# comma-separated line. Results are collected in ``res`` and each row's cell
# list is printed as it is processed.
url = 'http://www.hnxcdb.com/readgg.asp?id=1623'

# A timeout keeps the script from hanging forever on an unresponsive server,
# and raise_for_status() stops us from parsing an HTTP error page as data.
response = requests.get(url, timeout=10)
response.raise_for_status()
response.encoding = 'gb2312'  # decode the body as GB2312 instead of requests' guess
html = response.text

soup = BeautifulSoup(html, 'html.parser')
# html.parser does not insert a <tbody> that is absent from the markup, so
# ``soup.tbody`` may be None; fall back to searching the whole document.
content = soup.tbody
if content is None:
    content = soup

res = []
for row in content.find_all('tr'):
    # get_text() also covers cells whose text is wrapped in nested tags;
    # ``.string`` is None for those, which would drop the cell and shift
    # the remaining columns of the row.
    cells = [cell.get_text().strip() for cell in row.find_all('td')]
    print(cells)
    res.append(','.join(cells))

猜你喜欢

转载自blog.csdn.net/huangqihao723/article/details/81712863