これを行う方法の 2 つの例を次に示します。
from lxml import etree
import xml.etree.ElementTree as ElementTree
CONTENT = """
<process id="process1">
<log name="name1" device="device1"><![CDATA[timestamp value]]></log>
<log name="name2" device="device2"><![CDATA[timestamp value, timestamp value, timestamp]]></log>
</process>
"""
def parse_with_lxml():
root = etree.fromstring(CONTENT)
for log in root.xpath("//log"):
print log.text
def parse_with_stdlib():
root = ElementTree.fromstring(CONTENT)
for log in root.iter('log'):
print log.text
if __name__ == '__main__':
parse_with_lxml()
parse_with_stdlib()
出力:
timestamp value
timestamp value, timestamp value, timestamp
timestamp value
timestamp value, timestamp value, timestamp
どちらの場合もそれを処理するテキスト属性。