# ElementTree (standard library)
from xml.etree import ElementTree as ET
# Path of the XML file to parse. xml_file must be assigned before the parse
# call below runs; the example assignment here is commented out.
# xml_file = r"D:\Deep_Learning_data\yolo\gen_data\test_xml\2007_000323.xml"
# Parse the file and keep the document's root element.
root = ET.parse(xml_file).getroot()
# Text of the first direct <filename> child of the root. find() returns None
# when there is no such child, in which case .text raises AttributeError.
img_name = root.find("filename").text
# lxml
from lxml import etree
# Read the page as UTF-8 inside a context manager so the file handle is
# closed as soon as the content has been read (the bare open(...).read()
# form leaves the handle open until garbage collection).
with open('web.html', encoding='utf-8') as f:
    # etree.HTML is highly fault-tolerant with imperfect markup.
    html = etree.HTML(f.read())
'''
选取节点
'''
# print(len(html.xpath('//div')))
# print(len(html.xpath('/html/body/div'))) # search starting from the root node
# print(len(html.xpath('//div/a'))) # search anywhere in the document
# print(len(html.xpath('//div/a/..'))) # '..' selects the node's parent; '.' selects the node itself
# print(html.xpath("//div[@class='left']/a")) # [@class='xxx'] filters by attribute value