"""Demonstrate common XPath queries with lxml against a local ``test.html``."""

from lxml import etree


def main():
    """Parse ``test.html`` and print the ``src`` of images in ``div.song``.

    The commented-out queries below are alternative XPath expressions kept
    as a quick reference; swap one in for the active query to try it.
    """
    # NOTE(review): etree.parse() with no parser argument uses lxml's default
    # XML parser, so test.html presumably has to be well-formed markup. If it
    # is not, passing etree.HTMLParser() as the second argument is the usual
    # remedy -- confirm against the actual file before changing.
    tree = etree.parse('test.html')

    # Absolute path from the document root:
    # r = tree.xpath('/html/body/div')
    # "//" in the middle of a path skips any number of levels:
    # r = tree.xpath('/html//div')
    # Leading "//" matches from anywhere in the document:
    # r = tree.xpath('//div')
    # Attribute predicate:
    # r = tree.xpath('//div[@class="song"]')
    # Positional predicate (indexing starts at 1):
    # r = tree.xpath('//div[@class="song"]/p[3]')
    # /text() selects the text directly inside the tag:
    # r = tree.xpath('//div[@class="tang"]//li[5]/a/text()')[0]
    # //text() selects all text anywhere beneath the tag:
    # r = tree.xpath('//div[@class="tang"]//text()')

    # /@attr selects an attribute value.
    r = tree.xpath('//div[@class="song"]/img/@src')
    print(r)


if __name__ == "__main__":
    main()
