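# lxml库

```python
from lxml import etree

# 将 HTML 字符串解析为元素树
html = etree.HTML(text)

# 也可直接解析 HTML 文件。
# 注意:etree.HTML() 的第一个参数是 HTML 文本本身,传入 'test.html'
# 只会把这个文件名当作文本解析;读取文件应使用 etree.parse()。
html = etree.parse('test.html', etree.HTMLParser())
```

而后可进行 `html.xpath(...)` 查询。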