python 使用python3.4解析xml文件(sax、dom、etree)
调用sax模块处理xml文件。
#重载了三个方法
#处理xml,主要就是写自己的事件处理类
from xml.sax import *
class DengHandler(ContentHandler):
    def startDocument(self):
        print("----开始解析xml文档----")
    def endDocument(self):
        print("----xml文档解析完毕----")
    def startElement(self,name,attrs):
        if name == "author":
            print("名字:",attrs['name']," 日期:",attrs["birth"])
parse("deng.xml",DengHandler())
deng.xml
<?xml version = "1.0" encoding = "utf-8"?>
    <author name = "dengjingdong" birth = "19920517"></author>
</people>
调用dom模块中的minidom处理xml文件。
from xml.dom.minidom import *
#scannode函数打印xml文件的结构
def scannode(doc,level = 0):
    ret = doc.__class__.__name__
    if doc.nodeType == Node.ELEMENT_NODE:
        ret += ",标签:" + doc.tagName
    print(" "*4*level,ret)
    if doc.hasChildNodes:
        for child in doc.childNodes:
            scannode(child,level+1)
#----scannode-----
xin = parse("book.xml")
print(xin)
scannode(xin)
#----scannode-----
x = parse("domtest.xml")
nx = x.getElementsByTagName("author")
print(nx[0].getAttribute("birth"))
print(nx[0].childNodes[0].data)
print(nx[1].getAttribute("birth"))
print(nx[1].childNodes[0].data)
book.xml
<?xml version = "1.0" encoding = "utf-8" ?>
<book>
    <title>the book title</title>
    <author>
        <name>jingdong</name>
        <boy>true</boy>
    </author>
    <chapter number = "1">
        <title> first chapter </title>
        <para>
            I love python.
        </para>
    </chapter>
</book>
domtest.xml
<?xml version = "1.0" encoding = "utf-8" ?>
<people>
    <author name = "dengjingdong" birth = "1990517">dongdong</author>
    <author name = "wushengnan" birth = "19920520">nannan</author>
</people>
调用etree模块中的ElementTree生成所需的xml文件。
import xml.etree.ElementTree as et
x = et.Element("name")
x.text = "dengjingdong"
x.set("boy","true")
sx = et.tostring(x)
print(sx)
