from lxml import etree


def main():
    """Parse ``test.html`` and print the ``src`` attributes of the "song" images.

    The file is read from the current working directory. The printed value
    is the list returned by ``tree.xpath`` for the ``@src`` query below.
    """
    # etree.parse() defaults to the strict XML parser, which raises
    # XMLSyntaxError on ordinary HTML (unclosed <img>/<br>, unquoted
    # attributes, ...). Pass an HTML parser explicitly instead.
    tree = etree.parse('test.html', parser=etree.HTMLParser())

    # Other XPath queries that can be run against the same tree:
    #   tree.xpath('/html/body/div')
    #   tree.xpath('/html//div')
    #   tree.xpath('//div')
    #   tree.xpath('//div[@class="song"]')
    #   tree.xpath('//div[@class="song"]/p[3]')
    #       positional indices start at 1
    #   tree.xpath('//div[@class="tang"]//li[5]/a/text()')[0]
    #       /text() returns only the text directly inside the tag
    #   tree.xpath('//div[@class="tang"]//text()')
    #       //text() returns all text anywhere beneath the tag
    image_sources = tree.xpath('//div[@class="song"]/img/@src')
    print(image_sources)


if __name__ == "__main__":
    main()