from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup
# Page whose news list is scraped; also the base for resolving relative links.
url = "http://mxd.sdo.com/web6/home/index.asp"
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36',
}

# Anchor text of the "more" link inside the news list; it is not a news item.
MORE_LINK_TEXT = "更多"

# Seconds to wait for the server before giving up instead of hanging forever.
REQUEST_TIMEOUT = 10


def fetch_news_links(page_url=url, request_headers=None, timeout=REQUEST_TIMEOUT):
    """Download *page_url* and return the anchors found in its news list.

    Args:
        page_url: Address of the page to download.
        request_headers: HTTP headers to send; the module-level ``headers``
            are used when this is ``None`` or empty.
        timeout: Seconds to wait for the server.

    Returns:
        A list of ``(text, href)`` tuples, one per ``<a>`` element inside the
        ``<div class="news-list">`` element, in document order. ``href`` is
        ``None`` for anchors without that attribute. The list is empty when
        the page contains no such div.

    Raises:
        requests.RequestException: On network failure, timeout, or an HTTP
            error status.
    """
    response = requests.get(
        page_url, headers=request_headers or headers, timeout=timeout
    )
    response.raise_for_status()
    soup = BeautifulSoup(response.text, "html.parser")
    # attrs must be a dict mapping attribute name to value; a set literal
    # would be interpreted as "class is any of these strings".
    news_list = soup.find("div", attrs={"class": "news-list"})
    if news_list is None:
        return []
    return [
        (anchor.get_text(), anchor.get("href"))
        for anchor in news_list.find_all("a")
    ]


def format_news_lines(links, base_url=url):
    """Turn ``(text, href)`` pairs into numbered ``"N - text - url"`` lines.

    Pairs whose stripped text equals ``MORE_LINK_TEXT`` and pairs without an
    href are skipped and do not consume a number. Relative hrefs are resolved
    against *base_url*; absolute hrefs are left unchanged.

    Args:
        links: Iterable of ``(text, href)`` pairs.
        base_url: URL that relative hrefs are resolved against.

    Returns:
        A list of formatted lines, numbered from 1.
    """
    lines = []
    for text, href in links:
        # Compare the whole stripped text rather than using a substring test,
        # so a headline that merely contains the word is still listed.
        if text.strip() == MORE_LINK_TEXT:
            continue
        if not href:
            continue
        lines.append(f"{len(lines) + 1} - {text} - {urljoin(base_url, href)}")
    return lines


def main():
    """Fetch the news list and print one numbered line per news item."""
    for line in format_news_lines(fetch_news_links()):
        print(line)


if __name__ == "__main__":
    main()
# Sample output:
# 1 - 全新版本荣耀上线 新的战役即将拉开序幕 - http://act.mxd.sdo.com/project/v168/
# 2 - “斗鱼杯”冒险岛开荒升级竞速赛即将打响! - https://m.douyu.com/232838
# 3 - 皇家礼品袋更新 懒懒胖胖小企鹅 - http://mxd.sdo.com/web6/news/newsContent.asp?ID=313560&CategoryID=273
# 4 - 满载珍宝与惊喜的魔法马车驾到!手慢则无! - http://mxd.sdo.com/web6/news/newsContent.asp?ID=310549&CategoryID=274
# 5 - 转蛋万花筒更新 荣耀勇士的极品之选 - http://mxd.sdo.com/web6/news/newsContent.asp?ID=313466&CategoryID=273
# 6 - 品克缤敲敲乐更新 神秘之影防具爆率提升3倍 - http://mxd.sdo.com/web6/news/newsContent.asp?ID=313465&CategoryID=273
# 7 - 皇家脸型最新发布 童言无忌小可爱 - http://mxd.sdo.com/web6/news/newsContent.asp?ID=313464&CategoryID=273
# 8 - 皇家发型最新发布 香甜的焦糖少年少女 - http://mxd.sdo.com/web6/news/newsContent.asp?ID=313463&CategoryID=273
# 9 - 三九寒冬添置冬衣 家具栏扩展券为你准备充足空间 - http://act.mxd.sdo.com/project/v168/a06.html#con
# 10 - 成为新时代的记录者 记录那一天之后的新篇章 - http://act.mxd.sdo.com/project/v168/a06.html#con