// 雙斜槓:寫在 XPath 表達式開頭時,會從文檔根節點開始對全文進行掃描,選取文檔中所有符合條件的節點,以列表的形式返回。
// 會從當前節點出發,選取文檔中所有匹配的節點,而不考慮它們在文檔中的位置。
# !/usr/bin/env python
# -*- coding: utf-8 -*-
from lxml import etree

# Parse the XML document into an element tree. 'text.xml' is a relative
# path, so it is resolved against the current working directory.
htmlEmt = etree.parse('text.xml')

# '//li' selects every <li> element anywhere in the document; the matches
# come back as a list of elements.
result = htmlEmt.xpath('//li')

# Single-argument print(...) calls behave identically on Python 2.7 and
# Python 3, unlike the Python-2-only `print x` statement form.
print(result)
print(type(result))

# For each matched element, show the element object, its type, and the
# text it contains.
for x in result:
    print(x)
    print(type(x))
    print(x.text)
C:\Python27\python.exe C:/Users/TLCB/PycharmProjects/untitled/xpath/l1.py
[<Element li at 0x26da9e0>, <Element li at 0x26da198>, <Element li at 0x26da030>, <Element li at 0x26da0d0>, <Element li at 0x26da238>]
<type 'list'>
<Element li at 0x26da9e0>
<type 'lxml.etree._Element'>
a01
<Element li at 0x26da198>
<type 'lxml.etree._Element'>
b02
<Element li at 0x26da030>
<type 'lxml.etree._Element'>
c03
<Element li at 0x26da0d0>
<type 'lxml.etree._Element'>
d04
<Element li at 0x26da238>
<type 'lxml.etree._Element'>
e05
Process finished with exit code 0