XML 读取

ElementTree


from xml.etree import ElementTree as ET

# Sample path of the XML file to read; point this at your own file.
# The assignment must be live: the parse call below reads `xml_file`.
xml_file = r"D:\Deep_Learning_data\yolo\gen_data\test_xml\2007_000323.xml"
# Parse the document and take its root element.
root = ET.parse(xml_file).getroot()
# Text of the first direct <filename> child of the root.
# NOTE(review): raises AttributeError if the root has no <filename> child.
img_name = root.find("filename").text

lxml

from lxml import etree

# Read the page inside a context manager so the file handle is closed
# as soon as its contents have been consumed.
with open('web.html', encoding='utf-8') as page_file:
    # etree.HTML is fault-tolerant with imperfect markup.
    html = etree.HTML(page_file.read())

# Selecting nodes with XPath (examples, left commented out):
# print(len(html.xpath('//div')))
# print(len(html.xpath('/html/body/div')))     # search starting from the root node
# print(len(html.xpath('//div/a')))            # search anywhere in the document
# print(len(html.xpath('//div/a/..')))         # ".." selects the parent node; "." is the node itself
# print(html.xpath("//div[@class='left']/a"))  # [@class='xxx'] filters by attribute value

猜你喜欢

转载自 https://blog.csdn.net/luolinll1212/article/details/85005724