debian-xmlschema/xmlschema/validators/identities.py

363 lines
14 KiB
Python

# -*- coding: utf-8 -*-
#
# Copyright (c), 2016-2019, SISSA (International School for Advanced Studies).
# All rights reserved.
# This file is distributed under the terms of the MIT License.
# See the file 'LICENSE' in the root directory of the present
# distribution, or http://opensource.org/licenses/MIT.
#
# @author Davide Brunato <brunato@sissa.it>
#
"""
This module contains classes for other XML Schema identity constraints.
"""
from __future__ import unicode_literals
import re
from collections import Counter
from elementpath import Selector, XPath1Parser, ElementPathError
from ..exceptions import XMLSchemaValueError
from ..qnames import XSD_ANNOTATION, XSD_QNAME, XSD_UNIQUE, XSD_KEY, XSD_KEYREF, \
XSD_SELECTOR, XSD_FIELD, get_qname, qname_to_prefixed, qname_to_extended
from ..etree import etree_getpath
from ..regex import get_python_regex
from .exceptions import XMLSchemaValidationError
from .xsdbase import XsdComponent
XSD_IDENTITY_XPATH_SYMBOLS = {
'processing-instruction', 'following-sibling', 'preceding-sibling',
'ancestor-or-self', 'attribute', 'following', 'namespace', 'preceding',
'ancestor', 'position', 'comment', 'parent', 'child', 'false', 'text', 'node',
'true', 'last', 'not', 'and', 'mod', 'div', 'or', '..', '//', '!=', '<=', '>=', '(', ')',
'[', ']', '.', '@', ',', '/', '|', '*', '-', '=', '+', '<', '>', ':', '(end)', '(name)',
'(string)', '(float)', '(decimal)', '(integer)', '::'
}
class XsdIdentityXPathParser(XPath1Parser):
symbol_table = {k: v for k, v in XPath1Parser.symbol_table.items() if k in XSD_IDENTITY_XPATH_SYMBOLS}
SYMBOLS = XSD_IDENTITY_XPATH_SYMBOLS
XsdIdentityXPathParser.build_tokenizer()
class XsdSelector(XsdComponent):
"""Class for defining an XPath selector for an XSD identity constraint."""
_ADMITTED_TAGS = {XSD_SELECTOR}
pattern = re.compile(get_python_regex(
r"(\.//)?(((child::)?((\i\c*:)?(\i\c*|\*)))|\.)(/(((child::)?((\i\c*:)?(\i\c*|\*)))|\.))*(\|"
r"(\.//)?(((child::)?((\i\c*:)?(\i\c*|\*)))|\.)(/(((child::)?((\i\c*:)?(\i\c*|\*)))|\.))*)*"
))
def __init__(self, elem, schema, parent):
super(XsdSelector, self).__init__(elem, schema, parent)
def _parse(self):
super(XsdSelector, self)._parse()
try:
self.path = self.elem.attrib['xpath']
except KeyError:
self.parse_error("'xpath' attribute required:", self.elem)
self.path = "*"
else:
if not self.pattern.match(self.path.replace(' ', '')):
self.parse_error("Wrong XPath expression for an xs:selector")
try:
self.xpath_selector = Selector(self.path, self.namespaces, parser=XsdIdentityXPathParser)
except ElementPathError as err:
self.parse_error(err)
self.xpath_selector = Selector('*', self.namespaces, parser=XsdIdentityXPathParser)
# XSD 1.1 xpathDefaultNamespace attribute
if self.schema.XSD_VERSION > '1.0':
if 'xpathDefaultNamespace' in self.elem.attrib:
self.xpath_default_namespace = self._parse_xpath_default_namespace(self.elem)
else:
self.xpath_default_namespace = self.schema.xpath_default_namespace
def __repr__(self):
return '%s(path=%r)' % (self.__class__.__name__, self.path)
@property
def built(self):
return True
class XsdFieldSelector(XsdSelector):
"""Class for defining an XPath field selector for an XSD identity constraint."""
_ADMITTED_TAGS = {XSD_FIELD}
pattern = re.compile(get_python_regex(
r"(\.//)?((((child::)?((\i\c*:)?(\i\c*|\*)))|\.)/)*((((child::)?((\i\c*:)?(\i\c*|\*)))|\.)|"
r"((attribute::|@)((\i\c*:)?(\i\c*|\*))))(\|(\.//)?((((child::)?((\i\c*:)?(\i\c*|\*)))|\.)/)*"
r"((((child::)?((\i\c*:)?(\i\c*|\*)))|\.)|((attribute::|@)((\i\c*:)?(\i\c*|\*)))))*"
))
class XsdIdentity(XsdComponent):
"""
Common class for XSD identity constraints.
:ivar selector: the XPath selector of the identity constraint.
:ivar fields: a list containing the XPath field selectors of the identity constraint.
"""
selector = None
fields = ()
def __init__(self, elem, schema, parent):
super(XsdIdentity, self).__init__(elem, schema, parent)
def _parse(self):
super(XsdIdentity, self)._parse()
elem = self.elem
try:
self.name = get_qname(self.target_namespace, elem.attrib['name'])
except KeyError:
self.parse_error("missing required attribute 'name'", elem)
self.name = None
for index, child in enumerate(elem):
if child.tag == XSD_SELECTOR:
self.selector = XsdSelector(child, self.schema, self)
break
elif child.tag != XSD_ANNOTATION:
self.parse_error("'selector' declaration expected.", elem)
break
else:
self.parse_error("missing 'selector' declaration.", elem)
index = -1
self.fields = []
for child in filter(lambda x: x.tag != XSD_ANNOTATION, elem[index + 1:]):
if child.tag == XSD_FIELD:
self.fields.append(XsdFieldSelector(child, self.schema, self))
else:
self.parse_error("element %r not allowed here:" % child.tag, elem)
def _parse_identity_reference(self):
super(XsdIdentity, self)._parse()
self.name = get_qname(self.target_namespace, self.elem.attrib['ref'])
if 'name' in self.elem.attrib:
self.parse_error("attributes 'name' and 'ref' are mutually exclusive")
elif self._parse_child_component(self.elem) is not None:
self.parse_error("a reference cannot has child definitions")
def iter_elements(self):
for xsd_element in self.selector.xpath_selector.iter_select(self.parent):
yield xsd_element
def get_fields(self, context, namespaces=None, decoders=None):
"""
Get fields for a schema or instance context element.
:param context: context Element or XsdElement
:param namespaces: is an optional mapping from namespace prefix to URI.
:param decoders: context schema fields decoders.
:return: a tuple with field values. An empty field is replaced by `None`.
"""
fields = []
for k, field in enumerate(self.fields):
result = field.xpath_selector.select(context)
if not result:
if not isinstance(self, XsdKey) or 'ref' in context.attrib and \
self.schema.meta_schema is None and self.schema.XSD_VERSION != '1.0':
fields.append(None)
else:
raise XMLSchemaValueError("%r key field must have a value!" % field)
elif len(result) == 1:
if decoders is None or decoders[k] is None:
fields.append(result[0])
else:
value = decoders[k].data_value(result[0])
if decoders[k].type.root_type.name == XSD_QNAME:
value = qname_to_extended(value, namespaces)
if isinstance(value, list):
fields.append(tuple(value))
else:
fields.append(value)
else:
raise XMLSchemaValueError("%r field selects multiple values!" % field)
return tuple(fields)
def iter_values(self, elem, namespaces):
"""
Iterate field values, excluding empty values (tuples with all `None` values).
:param elem: instance XML element.
:param namespaces: XML document namespaces.
:return: N-Tuple with value fields.
"""
current_path = ''
xsd_fields = None
for e in self.selector.xpath_selector.iter_select(elem):
path = etree_getpath(e, elem)
if current_path != path:
# Change the XSD context only if the path is changed
current_path = path
xsd_element = self.parent.find(path)
if not hasattr(xsd_element, 'tag'):
yield XMLSchemaValidationError(self, e, "{!r} is not an element".format(xsd_element))
xsd_fields = self.get_fields(xsd_element)
if all(fld is None for fld in xsd_fields):
continue
try:
fields = self.get_fields(e, namespaces, decoders=xsd_fields)
except XMLSchemaValueError as err:
yield XMLSchemaValidationError(self, e, reason=str(err))
else:
if any(fld is not None for fld in fields):
yield fields
@property
def built(self):
return self.selector is not None
def __call__(self, elem, namespaces):
values = Counter()
for v in self.iter_values(elem, namespaces):
if isinstance(v, XMLSchemaValidationError):
yield v
else:
values[v] += 1
for value, count in values.items():
if value and count > 1:
yield XMLSchemaValidationError(self, elem, reason="duplicated value {!r}.".format(value))
class XsdUnique(XsdIdentity):
_ADMITTED_TAGS = {XSD_UNIQUE}
class XsdKey(XsdIdentity):
_ADMITTED_TAGS = {XSD_KEY}
class XsdKeyref(XsdIdentity):
"""
Implementation of xs:keyref.
:ivar refer: reference to a *xs:key* declaration that must be in the same element \
or in a descendant element.
"""
_ADMITTED_TAGS = {XSD_KEYREF}
refer = None
refer_path = '.'
def __repr__(self):
return '%s(name=%r, refer=%r)' % (
self.__class__.__name__, self.prefixed_name, getattr(self.refer, 'prefixed_name', None)
)
def _parse(self):
super(XsdKeyref, self)._parse()
try:
self.refer = self.schema.resolve_qname(self.elem.attrib['refer'])
except (KeyError, ValueError, RuntimeError) as err:
if 'refer' not in self.elem.attrib:
self.parse_error("missing required attribute 'refer'")
else:
self.parse_error(err)
def parse_refer(self):
if self.refer is None:
return # attribute or key/unique identity constraint missing
elif isinstance(self.refer, (XsdKey, XsdUnique)):
return # referenced key/unique identity constraint already set
refer = self.parent.identities.get(self.refer)
if refer is not None and refer.ref is None:
self.refer = refer
else:
try:
self.refer = self.maps.identities[self.refer]
except KeyError:
self.parse_error("key/unique identity constraint %r is missing" % self.refer)
return
if not isinstance(self.refer, (XsdKey, XsdUnique)):
self.parse_error("reference to a non key/unique identity constraint %r" % self.refer)
elif len(self.refer.fields) != len(self.fields):
self.parse_error("field cardinality mismatch between %r and %r" % (self, self.refer))
elif self.parent is not self.refer.parent:
refer_path = self.refer.parent.get_path(ancestor=self.parent)
if refer_path is None:
# From a note in par. 3.11.5 Part 1 of XSD 1.0 spec: "keyref identity-constraints may be
# defined on domains distinct from the embedded domain of the identity-constraint they
# reference, or the domains may be the same but self-embedding at some depth. In either
# case the node table for the referenced identity-constraint needs to propagate upwards,
# with conflict resolution."
refer_path = self.parent.get_path(ancestor=self.refer.parent, reverse=True)
if refer_path is None:
refer_path = self.parent.get_path(reverse=True) + '/' + self.refer.parent.get_path()
self.refer_path = refer_path
@property
def built(self):
return self.selector is not None and isinstance(self.refer, XsdIdentity)
def get_refer_values(self, elem, namespaces):
values = set()
for e in elem.iterfind(self.refer_path):
for v in self.refer.iter_values(e, namespaces):
if not isinstance(v, XMLSchemaValidationError):
values.add(v)
return values
def __call__(self, elem, namespaces):
if self.refer is None:
return
refer_values = None
for v in self.iter_values(elem, namespaces):
if isinstance(v, XMLSchemaValidationError):
yield v
continue
if refer_values is None:
try:
refer_values = self.get_refer_values(elem, namespaces)
except XMLSchemaValueError as err:
yield XMLSchemaValidationError(self, elem, str(err))
continue
if v not in refer_values:
reason = "Key {!r} with value {!r} not found for identity constraint of element {!r}." \
.format(self.prefixed_name, v, qname_to_prefixed(elem.tag, self.namespaces))
yield XMLSchemaValidationError(validator=self, obj=elem, reason=reason)
class Xsd11Unique(XsdUnique):
def _parse(self):
if self._parse_reference():
super(XsdIdentity, self)._parse()
self.ref = True
else:
super(Xsd11Unique, self)._parse()
class Xsd11Key(XsdKey):
def _parse(self):
if self._parse_reference():
super(XsdIdentity, self)._parse()
self.ref = True
else:
super(Xsd11Key, self)._parse()
class Xsd11Keyref(XsdKeyref):
def _parse(self):
if self._parse_reference():
super(XsdIdentity, self)._parse()
self.ref = True
else:
super(Xsd11Keyref, self)._parse()