本文從以下兩個方面, 用Python實現XML的操作:
一. minidom寫入XML示例1
二. minidom寫入XML示例2
三. ElementTree寫入/修改示例
四. ElementTree讀取/修改/寫入示例
一. minidom寫入XML示例1
1.引入包
import xml.dom.minidom
2.write XML方法
writexml(writer, indent, addindent, newl, encoding) writer是文件對象 indent是每個tag前填充的字符,如:' ',則表示每個tag前有兩個空格 addindent是每個子結點的縮近字符,如下面的例子中單引號中我直接用的tab鍵 newl是每個tag后填充的字符,如:'\n',則表示每個tag后面有一個回車 encoding是生成的XML信息頭中的encoding屬性值,在輸出時minidom並不真正進行編碼的處理,如果你保存的文本內容中有漢字,則需要自已進行編碼轉換。
3.Python代碼
#xmlTest_write.py # -*- coding: utf-8 -*- import xml.dom.minidom #生成xml文件 def GenerateXml(): impl = xml.dom.minidom.getDOMImplementation() #設置根結點emps dom = impl.createDocument(None, 'emps', None) root = dom.documentElement employee = dom.createElement('emp') #增加屬性 employee.setAttribute("empno","1111") root.appendChild(employee) #設置子結點 #ename nameE=dom.createElement('ename') nameT=dom.createTextNode('傑克') nameE.appendChild(nameT) #子節點添加屬性 nameE.setAttribute("lastname","克") employee.appendChild(nameE) #age nameE=dom.createElement('age') nameT=dom.createTextNode('33') nameE.appendChild(nameT) employee.appendChild(nameE) f= open('emplist.xml', 'w') #w替換為a,追加 dom.writexml(f, addindent=' ', newl='\n') f.close() GenerateXml()
4.寫入XML結果
<?xml version="1.0" ?> <emps> <emp empno="1111"> <ename lastname="克">傑克</ename> <age>33</age> </emp> </emps>
二. minidom寫入XML示例2
1.Python代碼
#Python寫xml比較簡單,直接使用xml模塊的minidom即可對xml文件進行寫入操作 from xml.dom.minidom import Document doc = Document() people = doc.createElement("people") doc.appendChild(people) aperson = doc.createElement("person") people.appendChild(aperson) name = doc.createElement("name") aperson.appendChild(name) personname = doc.createTextNode("Annie") name.appendChild(personname) filename = "people.xml" f = open(filename, "w") f.write(doc.toprettyxml(indent=" ")) f.close()
2. 寫入XML結果
<?xml version="1.0" ?> <people> <person> <name>Annie</name> </person> </people>
三. ElementTree寫入/修改XML示例
1.寫入XMl的Python代碼
#coding=utf-8 import xml.etree.ElementTree as ET #創建根節點 root = ET.Element("root") #創建root的子節點sub1,並添加屬性 firstNode = ET.SubElement(root,"sub1") firstNode.attrib = {"name":"name attribute","age":"age attribute"} #創建子節點1(sub1)的子節點sub2,並添加數據 secondNode = ET.SubElement(firstNode,"sub2") secondNode.text = "test" #創建elementtree對象,寫文件 tree = ET.ElementTree(root) tree.write("test01.xml")
2. 寫入XML結果
<root> <sub1 age="age attribute" name="name attribute"> <sub2>test</sub2> </sub1> </root>
3. 修改XML方法
1. ElementTree.write("xmlfile"):更新xml文件 2. Element.append():為當前element對象添加子元素(element) 3. Element.set(key,value):為當前element的key屬性設置value值 4. Element.remove(element):刪除為element的節點
4. 修改XML的Python代碼
#coding=utf-8 import xml.etree.ElementTree as ET #讀取待修改文件 updateTree = ET.parse("test.xml") root = updateTree.getroot() #創建新節點並添加為root的子節點 newEle = ET.Element("NewElement") newEle.attrib = {"name":"NewElement","age":"20"} newEle.text = "This is a new element" root.append(newEle) #修改sub1的name屬性 sub1 = root.find("sub1") sub1.set("name","New Name") #修改sub2的數據值 sub2 = root.find("sub1/sub2") sub2.text = "New Value" #寫回原文件 updateTree.write("test.xml")
5. 修改XML結果
<root> <sub1 age="age attribute" name="New Name"> <sub2>New Value</sub2> </sub1> <NewElement age="20" name="NewElement">This is a new element</NewElement> </root>
四. ElementTree讀取/修改/寫入示例
1. 原始文檔內容(test.xml):
<?xml version="1.0" encoding="UTF-8"?> <framework> <processers> <processer name="AProcesser" file="lib64/A.so" path="/tmp"> </processer> <processer name="BProcesser" file="lib64/B.so" value="fordelete"> </processer> <processer name="BProcesser" file="lib64/B.so2222222"/> <services> <service name="search" prefix="/bin/search?" output_formatter="OutPutFormatter:service_inc"> <chain sequency="chain1"/> <chain sequency="chain2"></chain> </service> <service name="update" prefix="/bin/update?"> <chain sequency="chain3" value="fordelete"/> </service> </services> </processers> </framework>
2. Python操作xml代碼:
# -*- coding:utf-8 -*- ''' Created on 2018年8月30日 @author: Administrator ''' from xml.etree.ElementTree import ElementTree,Element def read_xml(in_path): '''''讀取並解析xml文件 in_path: xml路徑 return: ElementTree''' tree = ElementTree() tree.parse(in_path) return tree def write_xml(tree, out_path): '''''將xml文件寫出 tree: xml樹 out_path: 寫出路徑''' tree.write(out_path, encoding="utf-8",xml_declaration=True) def if_match(node, kv_map): '''''判斷某個節點是否包含所有傳入參數屬性 node: 節點 kv_map: 屬性及屬性值組成的map''' for key in kv_map: if node.get(key) != kv_map.get(key): return False return True #---------------search ----- def find_nodes(tree, path): '''''查找某個路徑匹配的所有節點 tree: xml樹 path: 節點路徑''' return tree.findall(path) def get_node_by_keyvalue(nodelist, kv_map): '''''根據屬性及屬性值定位符合的節點,返回節點 nodelist: 節點列表 kv_map: 匹配屬性及屬性值map''' result_nodes = [] for node in nodelist: if if_match(node, kv_map): result_nodes.append(node) return result_nodes #---------------change ----- def change_node_properties(nodelist, kv_map, is_delete=False): '''''修改/增加 /刪除 節點的屬性及屬性值 nodelist: 節點列表 kv_map:屬性及屬性值map''' for node in nodelist: for key in kv_map: if is_delete: if key in node.attrib: del node.attrib[key] else: node.set(key, kv_map.get(key)) def change_node_text(nodelist, text, is_add=False, is_delete=False): '''''改變/增加/刪除一個節點的文本 nodelist:節點列表 text : 更新后的文本''' for node in nodelist: if is_add: node.text += text elif is_delete: node.text = "" else: node.text = text def create_node(tag, property_map, content): '''''新造一個節點 tag:節點標簽 property_map:屬性及屬性值map content: 節點閉合標簽里的文本內容 return 新節點''' element = Element(tag, property_map) element.text = content return element def add_child_node(nodelist, element): '''''給一個節點添加子節點 nodelist: 節點列表 element: 子節點''' for node in nodelist: node.append(element) def del_node_by_tagkeyvalue(nodelist, tag, kv_map): '''''同過屬性及屬性值定位一個節點,並刪除之 nodelist: 父節點列表 tag:子節點標簽 kv_map: 屬性及屬性值列表''' for parent_node in nodelist: children = parent_node.getchildren() for child in children: if child.tag == tag and if_match(child, kv_map): parent_node.remove(child) if __name__ == "__main__": #1. 讀取xml文件 tree = read_xml("D://test.xml") #2. 屬性修改 #A. 找到父節點 nodes = find_nodes(tree, "processers/processer") #B. 通過屬性准確定位子節點 result_nodes = get_node_by_keyvalue(nodes, {"name":"BProcesser"}) #C. 修改節點屬性 change_node_properties(result_nodes, {"age": "1"}) #D. 刪除節點屬性 change_node_properties(result_nodes, {"value":""}, True) #3. 節點修改 #A.新建節點 a = create_node("person", {"age":"15","money":"200000"}, "this is the firest content") #B.插入到父節點之下 add_child_node(result_nodes, a) #4. 刪除節點 #定位父節點 del_parent_nodes = find_nodes(tree, "processers/services/service") #准確定位子節點並刪除之 target_del_node = del_node_by_tagkeyvalue(del_parent_nodes, "chain", {"sequency" : "chain1"}) #5. 修改節點文本 #定位節點 text_nodes = get_node_by_keyvalue(find_nodes(tree, "processers/services/service/chain"), {"sequency":"chain3"}) change_node_text(text_nodes, "new text") #6. 輸出到結果文件 write_xml(tree, "D://xiugai.xml")
3.更改之后的內容(xiugai.xml):
<?xml version='1.0' encoding='utf-8'?> <framework> <processers> <processer file="lib64/A.so" name="AProcesser" path="/tmp"> </processer> <processer age="1" file="lib64/B.so" name="BProcesser"> <person age="15" money="200000">this is the firest content</person></processer> <processer age="1" file="lib64/B.so2222222" name="BProcesser"><person age="15" money="200000">this is the firest content</person></processer> <services> <service name="search" output_formatter="OutPutFormatter:service_inc" prefix="/bin/search?"> <chain sequency="chain2" /> </service> <service name="update" prefix="/bin/update?"> <chain sequency="chain3" value="fordelete">new text</chain> </service> </services> </processers> </framework>
參考文章:
https://docs.python.org/3.5/library/xml.dom.minidom.html
https://docs.python.org/3.5/library/xml.etree.elementtree.html
https://blog.csdn.net/Tcorpion/article/details/75247168?locationNum=8&fps=1
https://blog.csdn.net/tcorpion/article/details/75244681
https://blog.csdn.net/weixin_39909877/article/details/78852287
https://www.jb51.net/article/146558.htm