ansible-later/testenv/lib/python2.7/site-packages/anyconfig/backend/xml.py

545 lines
18 KiB
Python
Raw Normal View History

2019-04-23 11:04:27 +00:00
#
# Copyright (C) 2011 - 2018 Satoru SATOH <ssato @ redhat.com>
# License: MIT
#
# Some XML modules may be missing and Base.{load,dumps}_impl are not overriden:
# pylint: disable=import-error, duplicate-except
# len(elem) is necessary to check that ET.Element object has children.
# pylint: disable=len-as-condition
r"""XML backend:
- Format to support: XML, e.g. http://www.w3.org/TR/xml11/
- Requirements: one of the followings
- xml.etree.cElementTree in standard lib if python >= 2.5
- xml.etree.ElementTree in standard lib if python >= 2.5
- elementtree.ElementTree (otherwise)
- Development Status :: 4 - Beta
- Limitations:
- special node '@attrs', '@text' and '@children' are used to keep XML
structure of original data. You have to cusomize them with 'tags' keyword
option to avoid any config parameters conflict with some of them.
- Some data or structures of original XML file may be lost if make it backed
to XML file; XML file - (anyconfig.load) -> config - (anyconfig.dump) ->
XML file
- XML specific features (namespace, etc.) may not be processed correctly.
- Special Options:
- ac_parse_value: Try to parse values, elements' text and attributes.
- merge_attrs: Merge attributes and mix with children nodes. Please note that
information of attributes are lost after load if this option is used.
- tags: A dict provide special parameter names to distinguish between
attributes, text and children nodes. Default is {"attrs": "@attrs", "text":
"@text", "children": "@children"}.
Changelog:
.. versionchanged:: 0.8.2
- Add special options, tags, merge_attrs and ac_parse_value
- Remove special option, pprefix which conflicts with another option tags
.. versionchanged:: 0.8.0
- Try to make a nested dict w/o extra dict having keys of attrs, text and
children from XML string/file as much as possible.
- Support namespaces partially.
.. versionchanged:: 0.1.0
- Added XML dump support.
"""
from __future__ import absolute_import
from io import BytesIO
import operator
import re
try:
import xml.etree.cElementTree as ET
except ImportError:
import xml.etree.ElementTree as ET
except ImportError:
import elementtree.ElementTree as ET
import anyconfig.backend.base
import anyconfig.compat
import anyconfig.utils
import anyconfig.parser
_TAGS = dict(attrs="@attrs", text="@text", children="@children")
_ET_NS_RE = re.compile(r"^{(\S+)}(\S+)$")
def _iterparse(xmlfile):
"""
Avoid bug in python 3.{2,3}. See http://bugs.python.org/issue9257.
:param xmlfile: XML file or file-like object
"""
try:
return ET.iterparse(xmlfile, events=("start-ns", ))
except TypeError:
return ET.iterparse(xmlfile, events=(b"start-ns", ))
def flip(tpl):
"""
>>> flip((1, 2))
(2, 1)
"""
return (tpl[1], tpl[0])
def _namespaces_from_file(xmlfile):
"""
:param xmlfile: XML file or file-like object
:return: {namespace_uri: namespace_prefix} or {}
"""
return dict(flip(t) for _, t in _iterparse(xmlfile))
def _tweak_ns(tag, **options):
"""
:param tag: XML tag element
:param nspaces: A namespaces dict, {uri: prefix}
:param options: Extra keyword options may contain 'nspaces' keyword option
provide a namespace dict, {uri: prefix}
>>> _tweak_ns("a", nspaces={})
'a'
>>> _tweak_ns("a", nspaces={"http://example.com/ns/val/": "val"})
'a'
>>> _tweak_ns("{http://example.com/ns/val/}a",
... nspaces={"http://example.com/ns/val/": "val"})
'val:a'
"""
nspaces = options.get("nspaces", None)
if nspaces is not None:
matched = _ET_NS_RE.match(tag)
if matched:
(uri, tag) = matched.groups()
prefix = nspaces.get(uri, False)
if prefix:
return "%s:%s" % (prefix, tag)
return tag
def _dicts_have_unique_keys(dics):
"""
:param dics: [<dict or dict-like object>], must not be [] or [{...}]
:return: True if all keys of each dict of `dics` are unique
# Enable the followings if to allow dics is [], [{...}]:
# >>> all(_dicts_have_unique_keys([d]) for [d]
# ... in ({}, {'a': 0}, {'a': 1, 'b': 0}))
# True
# >>> _dicts_have_unique_keys([{}, {'a': 1}, {'b': 2, 'c': 0}])
# True
>>> _dicts_have_unique_keys([{}, {'a': 1}, {'a': 2}])
False
>>> _dicts_have_unique_keys([{}, {'a': 1}, {'b': 2}, {'b': 3, 'c': 0}])
False
>>> _dicts_have_unique_keys([{}, {}])
True
"""
key_itr = anyconfig.compat.from_iterable(d.keys() for d in dics)
return len(set(key_itr)) == sum(len(d) for d in dics)
def _merge_dicts(dics, container=dict):
"""
:param dics: [<dict/-like object must not have same keys each other>]
:param container: callble to make a container object
:return: <container> object
>>> _merge_dicts(({}, ))
{}
>>> _merge_dicts(({'a': 1}, ))
{'a': 1}
>>> sorted(kv for kv in _merge_dicts(({'a': 1}, {'b': 2})).items())
[('a', 1), ('b', 2)]
"""
dic_itr = anyconfig.compat.from_iterable(d.items() for d in dics)
return container(anyconfig.compat.OrderedDict(dic_itr))
def _parse_text(val, **options):
"""
:return: Parsed value or value itself depends on `ac_parse_value`
"""
if val and options.get("ac_parse_value", False):
return anyconfig.parser.parse_single(val)
return val
def _process_elem_text(elem, dic, subdic, text="@text", **options):
"""
:param elem: ET Element object which has elem.text
:param dic: <container> (dict[-like]) object converted from elem
:param subdic: Sub <container> object converted from elem
:param options:
Keyword options, see the description of :func:`elem_to_container` for
more details.
:return: None but updating elem.text, dic and subdic as side effects
"""
elem.text = elem.text.strip()
if elem.text:
etext = _parse_text(elem.text, **options)
if len(elem) or elem.attrib:
subdic[text] = etext
else:
dic[elem.tag] = etext # Only text, e.g. <a>text</a>
def _parse_attrs(elem, container=dict, **options):
"""
:param elem: ET Element object has attributes (elem.attrib)
:param container: callble to make a container object
:return: Parsed value or value itself depends on `ac_parse_value`
"""
adic = dict((_tweak_ns(a, **options), v) for a, v in elem.attrib.items())
if options.get("ac_parse_value", False):
return container(dict((k, anyconfig.parser.parse_single(v))
for k, v in adic.items()))
return container(adic)
def _process_elem_attrs(elem, dic, subdic, container=dict, attrs="@attrs",
**options):
"""
:param elem: ET Element object or None
:param dic: <container> (dict[-like]) object converted from elem
:param subdic: Sub <container> object converted from elem
:param options:
Keyword options, see the description of :func:`elem_to_container` for
more details.
:return: None but updating dic and subdic as side effects
"""
adic = _parse_attrs(elem, container=container, **options)
if not elem.text and not len(elem) and options.get("merge_attrs"):
dic[elem.tag] = adic
else:
subdic[attrs] = adic
def _process_children_elems(elem, dic, subdic, container=dict,
children="@children", **options):
"""
:param elem: ET Element object or None
:param dic: <container> (dict[-like]) object converted from elem
:param subdic: Sub <container> object converted from elem
:param container: callble to make a container object
:param children: Tag for children nodes
:param options:
Keyword options, see the description of :func:`elem_to_container` for
more details.
:return: None but updating dic and subdic as side effects
"""
cdics = [elem_to_container(c, container=container, **options)
for c in elem]
merge_attrs = options.get("merge_attrs", False)
sdics = [container(elem.attrib) if merge_attrs else subdic] + cdics
if _dicts_have_unique_keys(sdics): # ex. <a><b>1</b><c>c</c></a>
dic[elem.tag] = _merge_dicts(sdics, container)
elif not subdic: # There are no attrs nor text and only these children.
dic[elem.tag] = cdics
else:
subdic[children] = cdics
def elem_to_container(elem, container=dict, **options):
"""
Convert XML ElementTree Element to a collection of container objects.
Elements are transformed to a node under special tagged nodes, attrs, text
and children, to store the type of these elements basically, however, in
some special cases like the followings, these nodes are attached to the
parent node directly for later convenience.
- There is only text element
- There are only children elements each has unique keys among all
:param elem: ET Element object or None
:param container: callble to make a container object
:param options: Keyword options
- nspaces: A namespaces dict, {uri: prefix} or None
- attrs, text, children: Tags for special nodes to keep XML info
- merge_attrs: Merge attributes and mix with children nodes, and the
information of attributes are lost after its transformation.
"""
dic = container()
if elem is None:
return dic
elem.tag = _tweak_ns(elem.tag, **options) # {ns}tag -> ns_prefix:tag
subdic = dic[elem.tag] = container()
options["container"] = container
if elem.text:
_process_elem_text(elem, dic, subdic, **options)
if elem.attrib:
_process_elem_attrs(elem, dic, subdic, **options)
if len(elem):
_process_children_elems(elem, dic, subdic, **options)
elif not elem.text and not elem.attrib: # ex. <tag/>.
dic[elem.tag] = None
return dic
def _complement_tag_options(options):
"""
:param options: Keyword options :: dict
>>> ref = _TAGS.copy()
>>> ref["text"] = "#text"
>>> opts = _complement_tag_options({"tags": {"text": ref["text"]}})
>>> del opts["tags"] # To simplify comparison.
>>> sorted(opts.items())
[('attrs', '@attrs'), ('children', '@children'), ('text', '#text')]
"""
if not all(nt in options for nt in _TAGS):
tags = options.get("tags", {})
for ntype, tag in _TAGS.items():
options[ntype] = tags.get(ntype, tag)
return options
def root_to_container(root, container=dict, nspaces=None, **options):
"""
Convert XML ElementTree Root Element to a collection of container objects.
:param root: etree root object or None
:param container: callble to make a container object
:param nspaces: A namespaces dict, {uri: prefix} or None
:param options: Keyword options,
- tags: Dict of tags for special nodes to keep XML info, attributes,
text and children nodes, e.g. {"attrs": "@attrs", "text": "#text"}
"""
tree = container()
if root is None:
return tree
if nspaces is not None:
for uri, prefix in nspaces.items():
root.attrib["xmlns:" + prefix if prefix else "xmlns"] = uri
return elem_to_container(root, container=container, nspaces=nspaces,
**_complement_tag_options(options))
def _to_str_fn(**options):
"""
:param options: Keyword options might have 'ac_parse_value' key
:param to_str: Callable to convert value to string
"""
return str if options.get("ac_parse_value") else anyconfig.utils.noop
def _elem_set_attrs(obj, parent, to_str):
"""
:param obj: Container instance gives attributes of XML Element
:param parent: XML ElementTree parent node object
:param to_str: Callable to convert value to string or None
:param options: Keyword options, see :func:`container_to_etree`
:return: None but parent will be modified
"""
for attr, val in anyconfig.compat.iteritems(obj):
parent.set(attr, to_str(val))
def _elem_from_descendants(children_nodes, **options):
"""
:param children_nodes: A list of child dict objects
:param options: Keyword options, see :func:`container_to_etree`
"""
for child in children_nodes: # child should be a dict-like object.
for ckey, cval in anyconfig.compat.iteritems(child):
celem = ET.Element(ckey)
container_to_etree(cval, parent=celem, **options)
yield celem
def _get_or_update_parent(key, val, to_str, parent=None, **options):
"""
:param key: Key of current child (dict{,-like} object)
:param val: Value of current child (dict{,-like} object or [dict{,...}])
:param to_str: Callable to convert value to string
:param parent: XML ElementTree parent node object or None
:param options: Keyword options, see :func:`container_to_etree`
"""
elem = ET.Element(key)
vals = val if anyconfig.utils.is_iterable(val) else [val]
for val_ in vals:
container_to_etree(val_, parent=elem, to_str=to_str, **options)
if parent is None: # 'elem' is the top level etree.
return elem
parent.append(elem)
return parent
_ATC = ("attrs", "text", "children")
def container_to_etree(obj, parent=None, to_str=None, **options):
"""
Convert a dict-like object to XML ElementTree.
:param obj: Container instance to convert to
:param parent: XML ElementTree parent node object or None
:param to_str: Callable to convert value to string or None
:param options: Keyword options,
- tags: Dict of tags for special nodes to keep XML info, attributes,
text and children nodes, e.g. {"attrs": "@attrs", "text": "#text"}
"""
if to_str is None:
to_str = _to_str_fn(**options)
if not anyconfig.utils.is_dict_like(obj):
if parent is not None and obj:
parent.text = to_str(obj) # Parent is a leaf text node.
return parent # All attributes and text should be set already.
options = _complement_tag_options(options)
(attrs, text, children) = operator.itemgetter(*_ATC)(options)
for key, val in anyconfig.compat.iteritems(obj):
if key == attrs:
_elem_set_attrs(val, parent, to_str)
elif key == text:
parent.text = to_str(val)
elif key == children:
for celem in _elem_from_descendants(val, **options):
parent.append(celem)
else:
parent = _get_or_update_parent(key, val, to_str, parent=parent,
**options)
return ET.ElementTree(parent)
def etree_write(tree, stream):
"""
Write XML ElementTree `root` content into `stream`.
.. note:
It seems that ET.ElementTree.write() cannot process a parameter
'xml_declaration' in python 2.6.
:param tree: XML ElementTree object
:param stream: File or file-like object can write to
"""
if anyconfig.compat.IS_PYTHON_2_6:
tree.write(stream, encoding='UTF-8')
else:
tree.write(stream, encoding='UTF-8', xml_declaration=True)
class Parser(anyconfig.backend.base.Parser,
anyconfig.backend.base.ToStreamDumperMixin,
anyconfig.backend.base.BinaryFilesMixin):
"""
Parser for XML files.
"""
_type = "xml"
_extensions = ["xml"]
_load_opts = _dump_opts = ["tags", "merge_attrs", "ac_parse_value"]
_ordered = True
_dict_opts = ["ac_dict"]
def load_from_string(self, content, container, **opts):
"""
Load config from XML snippet (a string `content`).
:param content:
XML snippet string of str (python 2) or bytes (python 3) type
:param container: callble to make a container object
:param opts: optional keyword parameters passed to
:return: Dict-like object holding config parameters
"""
root = ET.fromstring(content)
if anyconfig.compat.IS_PYTHON_3:
stream = BytesIO(content)
else:
stream = anyconfig.compat.StringIO(content)
nspaces = _namespaces_from_file(stream)
return root_to_container(root, container=container,
nspaces=nspaces, **opts)
def load_from_path(self, filepath, container, **opts):
"""
:param filepath: XML file path
:param container: callble to make a container object
:param opts: optional keyword parameters to be sanitized
:return: Dict-like object holding config parameters
"""
root = ET.parse(filepath).getroot()
nspaces = _namespaces_from_file(filepath)
return root_to_container(root, container=container,
nspaces=nspaces, **opts)
def load_from_stream(self, stream, container, **opts):
"""
:param stream: XML file or file-like object
:param container: callble to make a container object
:param opts: optional keyword parameters to be sanitized
:return: Dict-like object holding config parameters
"""
root = ET.parse(stream).getroot()
path = anyconfig.utils.get_path_from_stream(stream)
nspaces = _namespaces_from_file(path)
return root_to_container(root, container=container,
nspaces=nspaces, **opts)
def dump_to_string(self, cnf, **opts):
"""
:param cnf: Configuration data to dump
:param opts: optional keyword parameters
:return: string represents the configuration
"""
tree = container_to_etree(cnf, **opts)
buf = BytesIO()
etree_write(tree, buf)
return buf.getvalue()
def dump_to_stream(self, cnf, stream, **opts):
"""
:param cnf: Configuration data to dump
:param stream: Config file or file like object write to
:param opts: optional keyword parameters
"""
tree = container_to_etree(cnf, **opts)
etree_write(tree, stream)
# vim:sw=4:ts=4:et: