1.问题描述
属性无序问题和xml声明不是单独一行
# cat HKEX-EPS_20180830_003249795.xml
>1400
达到效果:
cat HKEX-EPS_20180830_003249795.xml
>
1400
2操作步骤
2.1环境说明
系统自带python2.6.6 升级为 python2.7.10
如果没有升级python2.7,
>>> import sys
>>> sys.path
路径为 /usr/lib64/python2.6/xml/dom
使用的模块是
import xml.dom.minidom
2.2换行处理
# cd /usr/local/lib/python2.7/xml/dom/
原始配置
def writexml(self, writer, indent="", addindent="", newl="",
encoding = None):
if encoding is None:
writer.write(''+newl)
else:
writer.write('%s' % (encoding, newl))
for node in self.childNodes:
node.writexml(writer, indent, addindent, newl)
修改配置
def writexml(self, writer, indent="", addindent="", newl="",
encoding = None):
if encoding is None:
writer.write(''+'\n')
else:
writer.write('%s' % (encoding, '\n'))
for node in self.childNodes:
node.writexml(writer, indent, addindent, newl)
2.3属性有序处理
原始配置
def __init__(self, tagName, namespaceURI=EMPTY_NAMESPACE, prefix=None,
localName=None):
self.tagName = self.nodeName = tagName
self.prefix = prefix
self.namespaceURI = namespaceURI
self.childNodes = NodeList()
self._attrs = {} # attributes are double-indexed:
self._attrsNS = {} # tagName -> Attribute
# URI,localName -> Attribute
# in the future: consider lazy generation
# of attribute objects this is too tricky
# for now because of headaches with
# namespaces.
......
def writexml(self, writer, indent="", addindent="", newl=""):
# indent = current indentation
# addindent = indentation to add to higher levels
# newl = newline string
writer.write(indent+"<" + self.tagName)
attrs = self._get_attributes()
a_names = attrs.keys()
a_names.sort()
修改配置:
def __init__(self, tagName, namespaceURI=EMPTY_NAMESPACE, prefix=None,
localName=None):
self.tagName = self.nodeName = tagName
self.prefix = prefix
self.namespaceURI = namespaceURI
self.childNodes = NodeList()
#self._attrs = {} # attributes are double-indexed:
self._attrs = OrderedDict() # attributes are double-indexed:
self._attrsNS = {} # tagName -> Attribute
# URI,localName -> Attribute
# in the future: consider lazy generation
# of attribute objects this is too tricky
# for now because of headaches with
# namespaces.
......
def writexml(self, writer, indent="", addindent="", newl=""):
# indent = current indentation
# addindent = indentation to add to higher levels
# newl = newline string
writer.write(indent+"<" + self.tagName)
attrs = self._get_attributes()
a_names = attrs.keys()
#a_names.sort()
3.总结
亲测可用