BeautifulSoup爬虫

一个范例

from bs4 import BeautifulSoup
import requests
# Download the raw HTML of the page to scrape.
url = r'http://guba.eastmoney.com/'
# A timeout keeps the script from hanging forever if the server never answers.
r = requests.get(url, timeout=10)
# Fail loudly on 4xx/5xx responses instead of parsing an error page.
r.raise_for_status()
html = r.text

# First pass: parse the whole downloaded page.
soup = BeautifulSoup(html, "html.parser")
# Collect every <div> whose id is "hotArticle".
div = soup.find_all('div', id="hotArticle")

# Second pass: render the matched divs back to a string and parse that
# fragment on its own, so later searches only see markup inside those divs.
# (The original ran this identical statement twice; once is enough.)
soup2 = BeautifulSoup(str(div), "html.parser")


# Print and concatenate the text of every second link inside the fragment,
# i.e. the anchors at positions 1, 3, 5, ... (0-based).
# NOTE(review): presumably the even-position anchors are not wanted here
# (e.g. a category/board link preceding each title) -- confirm against the
# live page markup.
anchors = soup2.find_all('a')
titles = []
for i in anchors[1::2]:
    # Tag.string is None when the <a> holds more than one child node; the
    # original then crashed on `li + None`. Fall back to the combined text.
    text = i.string if i.string is not None else i.get_text()
    print(text)
    titles.append(text)

# Join once at the end instead of growing the string inside the loop.
li = ''.join(titles)
# Kept for compatibility: the original loop left the total anchor count in n.
n = len(anchors)

猜你喜欢

转载自www.cnblogs.com/yukizzc/p/12525650.html