1   
  2   
  3   
  4   
  5   
  6   
  7   
  8   
  9   
 10   
 11   
 12   
 13   
 14   
 15   
 16  """Classes and global objects related to resolving U{XML 
 17  Namespaces<http://www.w3.org/TR/2006/REC-xml-names-20060816/index.html>}.""" 
 18   
 19  import pyxb 
 20  import pyxb.utils.utility 
 21  from pyxb.namespace import archive, utility 
 22  import logging 
 23   
 24  _log = logging.getLogger(__name__) 
 27      """Mix-in indicating that this object may have references to unseen named components. 
 28   
 29      This class is mixed-in to those XMLSchema components that have a reference 
 30      to another component that is identified by a QName.  Resolution of that 
 31      component may need to be delayed if the definition of the component has 
 32      not yet been read. 
 33      """ 
 34   
 35       
 36      _TraceResolution = False 
 37   
 39          """Determine whether this named component is resolved. 
 40   
 41          Override this in the child class.""" 
 42          raise NotImplementedError("_Resolvable_mixin.isResolved in %s"% (type(self).__name__,)) 
  43       
 45          """Perform whatever steps are required to resolve this component. 
 46   
 47          Resolution is performed in the context of the namespace to which the 
 48          component belongs.  Invoking this method may fail to complete the 
 49          resolution process if the component itself depends on unresolved 
 50          components.  The sole caller of this should be 
 51          L{_NamespaceResolution_mixin.resolveDefinitions}. 
 52           
 53          This method is permitted (nay, encouraged) to raise an exception if 
 54          resolution requires interpreting a QName and the named component 
 55          cannot be found. 
 56   
 57          Override this in the child class.  In the prefix, if L{isResolved} is 
 58          true, return right away.  If something prevents you from completing 
 59          resolution, invoke L{self._queueForResolution()} (so it is retried 
 60          later) and immediately return self.  Prior to leaving after successful 
 61          resolution discard any cached dom node by setting C{self.__domNode=None}. 
 62   
 63          @return: C{self}, whether or not resolution succeeds. 
 64          @raise pyxb.SchemaValidationError: if resolution requlres a reference to an unknown component 
 65          """ 
 66          raise NotImplementedError("_Resolvable_mixin._resolve in %s"% (type(self).__name__,)) 
  67   
 69          """Short-hand to requeue an object if the class implements _namespaceContext(). 
 70          """ 
 71          if (why is not None) and self._TraceResolution: 
 72              _log.info('Resolution delayed for %s: %s\n\tDepends on: %s', self, why, depends_on) 
 73          self._namespaceContext().queueForResolution(self, depends_on) 
   74   
 76      """Mix-in that aggregates those aspects of XMLNamespaces relevant to 
 77      resolving component references. 
 78      """ 
 79   
 80       
 81       
 82      __importedNamespaces = None 
 83   
 84       
 85       
 86      __referencedNamespaces = None 
 87   
 88       
 89       
 90      __unresolvedComponents = None 
 91   
 92       
 93       
 94       
 95      __unresolvedDependents = None 
 96   
106   
113   
118   
122   
127   
129          """Return the set of namespaces which some schema imported while 
130          processing with this namespace as target.""" 
131          return frozenset(self.__importedNamespaces) 
 132   
137           
139          """Return the set of namespaces which appear in namespace declarations 
140          of schema with this namespace as target.""" 
141          return frozenset(self.__referencedNamespaces) 
 142   
144          """Invoked to note that a component may have references that will need 
145          to be resolved. 
146   
147          Newly created named components are often unresolved, as are components 
148          which, in the course of resolution, are found to depend on another 
149          unresolved component. 
150   
151          @param resolvable: An instance of L{_Resolvable_mixin} that is later to 
152          be resolved. 
153   
154          @keyword depends_on: C{None}, or an instance of L{_Resolvable_mixin} 
155          which C{resolvable} requires to be resolved in order to resolve 
156          itself. 
157           
158          @return: C{resolvable} 
159          """ 
160          assert isinstance(resolvable, _Resolvable_mixin) 
161          if not resolvable.isResolved(): 
162              assert depends_on is None or isinstance(depends_on, _Resolvable_mixin) 
163              self.__unresolvedComponents.append(resolvable) 
164              if depends_on is not None and not depends_on.isResolved(): 
165                  from pyxb.xmlschema import structures 
166                  assert isinstance(depends_on, _Resolvable_mixin) 
167                  assert isinstance(depends_on, structures._NamedComponent_mixin) 
168                  self.__unresolvedDependents.setdefault(resolvable, set()).add(depends_on) 
169          return resolvable 
 170   
172          """Return C{True} iff this namespace has not been resolved.""" 
173          return self.__unresolvedComponents is not None 
 174   
193   
195          """Loop until all references within the associated resolvable objects 
196          have been resolved. 
197   
198          This method iterates through all components on the unresolved list, 
199          invoking the _resolve method of each.  If the component could not be 
200          resolved in this pass, it iis placed back on the list for the next 
201          iteration.  If an iteration completes without resolving any of the 
202          unresolved components, a pyxb.NotInNamespaceError exception is raised. 
203   
204          @note: Do not invoke this until all top-level definitions for the 
205          namespace have been provided.  The resolution routines are entitled to 
206          raise a validation exception if a reference to an unrecognized 
207          component is encountered. 
208          """ 
209          if not self.needsResolution(): 
210              return True 
211           
212          while 0 < len(self.__unresolvedComponents): 
213               
214               
215               
216              unresolved = self.__unresolvedComponents 
217               
218              self.__unresolvedComponents = [] 
219              self.__unresolvedDependents = {} 
220              for resolvable in unresolved: 
221                   
222                  resolvable._resolve() 
223   
224                   
225                  assert resolvable.isResolved() or (resolvable in self.__unresolvedComponents), 'Lost resolvable %s' % (resolvable,) 
226   
227                   
228                   
229                   
230                   
231                  if (resolvable.isResolved() and (resolvable._clones() is not None)): 
232                      assert False 
233              if self.__unresolvedComponents == unresolved: 
234                  if allow_unresolved: 
235                      return False 
236                   
237                   
238                   
239                  failed_components = [] 
240                  from pyxb.xmlschema import structures 
241                  for d in self.__unresolvedComponents: 
242                      if isinstance(d, structures._NamedComponent_mixin): 
243                          failed_components.append('%s named %s' % (d.__class__.__name__, d.name())) 
244                      else: 
245                          failed_components.append('Anonymous %s' % (d.__class__.__name__,)) 
246                  raise pyxb.NotInNamespaceError('Infinite loop in resolution:\n  %s' % ("\n  ".join(failed_components),)) 
247   
248           
249           
250          self.__unresolvedComponents = None 
251          self.__unresolvedDependents = None 
252   
253           
254           
255           
256           
257           
258          self._releaseNamespaceContexts() 
259   
260          return True 
 261       
265   
267          """Returns a map from unresolved components to sets of components that 
268          must be resolved first.""" 
269          return self.__unresolvedDependents 
  270   
272      """Resolve all components in the sibling_namespaces. 
273   
274      @param sibling_namespaces : A set of namespaces expected to be closed 
275      under dependency.""" 
276       
277      for ns in sibling_namespaces: 
278          ns.configureCategories([archive.NamespaceArchive._AnonymousCategory()]) 
279          ns.validateComponentModel() 
280   
281      def cmp_for_deps (ns1, ns2): 
282          """Sort namespaces so dependencies get resolved first""" 
283          if ns2 not in dependency_map.get(ns1, set()): 
284              return -1 
285          if ns1 not in dependency_map.get(ns2, set()): 
286              return 1 
287          return 0 
 288   
289      need_resolved_set = set(sibling_namespaces) 
290      dependency_map = {} 
291      last_state = None 
292      while need_resolved_set: 
293          need_resolved_list = list(need_resolved_set) 
294          if dependency_map: 
295              need_resolved_list.sort(cmp_for_deps) 
296          need_resolved_set = set() 
297          dependency_map = {} 
298          for ns in need_resolved_list: 
299              if not ns.needsResolution(): 
300                  continue 
301              if not ns.resolveDefinitions(allow_unresolved=True): 
302                  deps = dependency_map.setdefault(ns, set()) 
303                  for (c, dcs) in ns._unresolvedDependents().iteritems(): 
304                      for dc in dcs: 
305                          dns = dc.expandedName().namespace() 
306                          if dns != ns: 
307                              deps.add(dns) 
308                  _log.info('Holding incomplete resolution %s depending on: ', ns.uri(), u' ; '.join([ unicode(_dns) for _dns in deps ])) 
309                  need_resolved_set.add(ns) 
310           
311           
312           
313           
314           
315          state = [] 
316          for ns in need_resolved_set: 
317              state.append( (ns, len(ns._unresolvedComponents())) ) 
318          state = tuple(state) 
319          if last_state == state: 
320              raise pyxb.LogicError('Unexpected external dependency in sibling namespaces: %s' % (u"\n  ".join( [unicode(_ns) for _ns in need_resolved_set ]),)) 
321          last_state = state 
322   
323 -class NamespaceContext (object): 
 324      """Records information associated with namespaces at a DOM node. 
325      """ 
326   
327 -    def __str__ (self): 
 328          rv = [ u'NamespaceContext ' ] 
329          if self.defaultNamespace() is not None: 
330              rv.extend([ '(defaultNamespace=', unicode(self.defaultNamespace()), ') ']) 
331          if self.targetNamespace() is not None: 
332              rv.extend([ '(targetNamespace=', unicode(self.targetNamespace()), ') ']) 
333          rv.append("\n") 
334          for (pfx, ns) in self.inScopeNamespaces().items(): 
335              if pfx is not None: 
336                  rv.append('  xmlns:%s=%s' % (pfx, unicode(ns))) 
337          return u''.join(rv) 
 338   
339      __TargetNamespaceAttributes = { } 
340      @classmethod 
341 -    def _AddTargetNamespaceAttribute (cls, expanded_name, attribute_name): 
 344      @classmethod 
345 -    def _TargetNamespaceAttribute (cls, expanded_name): 
 347   
348       
349       
350      __pendingReferencedNamespaces = None 
351       
352 -    def defaultNamespace (self): 
 353          """The default namespace in effect at this node.  E.g., C{xmlns="URN:default"}.""" 
354          return self.__defaultNamespace 
 355      __defaultNamespace = None 
356   
357       
358       
359       
360       
361       
362       
363      __fallbackToTargetNamespace = False 
364   
365 -    def targetNamespace (self): 
 366          """The target namespace in effect at this node.  Usually from the 
367          C{targetNamespace} attribute.  If no namespace is specified for the 
368          schema, an absent namespace was assigned upon creation and will be 
369          returned.""" 
370          return self.__targetNamespace 
 371      __targetNamespace = None 
372   
374          """Map from prefix strings to L{Namespace} instances associated with those 
375          prefixes.  The prefix C{None} identifies the default namespace.""" 
376          return self.__inScopeNamespaces 
 377      __inScopeNamespaces = None 
378   
379 -    def prefixForNamespace (self, namespace): 
 380          """Return a prefix associated with the given namespace in this 
381          context, or None if the namespace is the default or is not in 
382          scope.""" 
383          for (pfx, ns) in self.__inScopeNamespaces.items(): 
384              if namespace == ns: 
385                  return pfx 
386          return None 
 387   
388      @classmethod 
389 -    def GetNodeContext (cls, node, **kw): 
 390          """Get the L{NamespaceContext} instance that was assigned to the node. 
391   
392          If none has been assigned and keyword parameters are present, create 
393          one treating this as the root node and the keyword parameters as 
394          configuration information (e.g., default_namespace). 
395   
396          @raise pyxb.LogicError: no context is available and the keywords 
397          required to create one were not provided 
398          """ 
399          try: 
400              return node.__namespaceContext 
401          except AttributeError: 
402              return NamespaceContext(node, **kw) 
 403   
404 -    def setNodeContext (self, node): 
 406   
407 -    def processXMLNS (self, prefix, uri): 
 408          if not self.__mutableInScopeNamespaces: 
409              self.__inScopeNamespaces = self.__inScopeNamespaces.copy() 
410              self.__mutableInScopeNamespaces = True 
411          if uri: 
412              if prefix is None: 
413                  ns = self.__defaultNamespace = utility.NamespaceForURI(uri, create_if_missing=True) 
414                  self.__inScopeNamespaces[None] = self.__defaultNamespace 
415              else: 
416                  ns = utility.NamespaceForURI(uri, create_if_missing=True) 
417                  self.__inScopeNamespaces[prefix] = ns 
418                   
419                   
420                   
421                   
422                   
423              if self.__targetNamespace: 
424                  self.__targetNamespace._referenceNamespace(ns) 
425              else: 
426                  self.__pendingReferencedNamespaces.add(ns) 
427          else: 
428               
429               
430               
431               
432               
433              if prefix is not None: 
434                  raise pyxb.NamespaceError(self, 'Attempt to undefine non-default namespace %s' % (prefix,)) 
435              self.__inScopeNamespaces.pop(prefix, None) 
436              self.__defaultNamespace = None 
 437   
438 -    def finalizeTargetNamespace (self, tns_uri=None, including_context=None): 
 439          if tns_uri is not None: 
440              assert 0 < len(tns_uri) 
441               
442               
443               
444               
445               
446              self.__targetNamespace = utility.NamespaceForURI(tns_uri, create_if_missing=True) 
447          elif self.__targetNamespace is None: 
448              if including_context is not None: 
449                  self.__targetNamespace = including_context.targetNamespace() 
450                  self.__fallbackToTargetNamespace = True 
451              elif tns_uri is None: 
452                  self.__targetNamespace = utility.CreateAbsentNamespace() 
453              else: 
454                  self.__targetNamespace = utility.NamespaceForURI(tns_uri, create_if_missing=True) 
455          if self.__pendingReferencedNamespaces is not None: 
456              [ self.__targetNamespace._referenceNamespace(_ns) for _ns in self.__pendingReferencedNamespaces ] 
457              self.__pendingReferencedNamespace = None 
458          assert self.__targetNamespace is not None 
459          if (not self.__fallbackToTargetNamespace) and self.__targetNamespace.isAbsentNamespace(): 
460              self.__fallbackToTargetNamespace = True 
 461   
462 -    def __init__ (self, 
463                    dom_node=None, 
464                    parent_context=None, 
465                    including_context=None, 
466                    recurse=True, 
467                    default_namespace=None, 
468                    target_namespace=None, 
469                    in_scope_namespaces=None, 
470                    expanded_name=None, 
471                    finalize_target_namespace=True):   
 472          """Determine the namespace context that should be associated with the 
473          given node and, optionally, its element children. 
474   
475          @param dom_node: The DOM node 
476          @type dom_node: C{xml.dom.Element} 
477          @keyword parent_context: Optional value that specifies the context 
478          associated with C{dom_node}'s parent node.  If not provided, only the 
479          C{xml} namespace is in scope. 
480          @type parent_context: L{NamespaceContext} 
481          @keyword recurse: If True (default), create namespace contexts for all 
482          element children of C{dom_node} 
483          @type recurse: C{bool} 
484          @keyword default_namespace: Optional value to set as the default 
485          namespace.  Values from C{parent_context} would override this, as 
486          would an C{xmlns} attribute in the C{dom_node}. 
487          @type default_namespace: L{NamespaceContext} 
488          @keyword target_namespace: Optional value to set as the target 
489          namespace.  Values from C{parent_context} would override this, as 
490          would a C{targetNamespace} attribute in the C{dom_node} 
491          @type target_namespace: L{NamespaceContext} 
492          @keyword in_scope_namespaces: Optional value to set as the initial set 
493          of in-scope namespaces.  The always-present namespaces are added to 
494          this if necessary. 
495          @type in_scope_namespaces: C{dict} mapping C{string} to L{Namespace}. 
496          """ 
497          from pyxb.namespace import builtin 
498   
499          if dom_node is not None: 
500              try: 
501                  assert dom_node.__namespaceContext is None 
502              except AttributeError: 
503                  pass 
504              dom_node.__namespaceContext = self 
505   
506          self.__defaultNamespace = default_namespace 
507          self.__targetNamespace = target_namespace 
508          self.__inScopeNamespaces = builtin._UndeclaredNamespaceMap 
509          self.__mutableInScopeNamespaces = False 
510   
511          if in_scope_namespaces is not None: 
512              if parent_context is not None: 
513                  raise pyxb.LogicError('Cannot provide both parent_context and in_scope_namespaces') 
514              self.__inScopeNamespaces = builtin._UndeclaredNamespaceMap.copy() 
515              self.__inScopeNamespaces.update(in_scope_namespaces) 
516              self.__mutableInScopeNamespaces = True 
517           
518          if parent_context is not None: 
519              self.__inScopeNamespaces = parent_context.inScopeNamespaces() 
520              self.__mutableInScopeNamespaces = False 
521              self.__defaultNamespace = parent_context.defaultNamespace() 
522              self.__targetNamespace = parent_context.targetNamespace() 
523              self.__fallbackToTargetNamespace = parent_context.__fallbackToTargetNamespace 
524               
525          if self.__targetNamespace is None: 
526              self.__pendingReferencedNamespaces = set() 
527          attribute_map = {} 
528          if dom_node is not None: 
529              if expanded_name is None: 
530                  expanded_name = pyxb.namespace.ExpandedName(dom_node) 
531              for ai in range(dom_node.attributes.length): 
532                  attr = dom_node.attributes.item(ai) 
533                  if builtin.XMLNamespaces.uri() == attr.namespaceURI: 
534                      prefix = attr.localName 
535                      if 'xmlns' == prefix: 
536                          prefix = None 
537                      self.processXMLNS(prefix, attr.value) 
538                  else: 
539                      if attr.namespaceURI is not None: 
540                          uri = utility.NamespaceForURI(attr.namespaceURI, create_if_missing=True) 
541                          key = pyxb.namespace.ExpandedName(uri, attr.localName) 
542                      else: 
543                          key = pyxb.namespace.ExpandedName(None, attr.localName) 
544                      attribute_map[key] = attr.value 
545           
546          if finalize_target_namespace: 
547              tns_uri = None 
548              tns_attr = self._TargetNamespaceAttribute(expanded_name) 
549              if tns_attr is not None: 
550                  tns_uri = attribute_map.get(tns_attr) 
551                  self.finalizeTargetNamespace(tns_uri, including_context=including_context) 
552   
553           
554           
555           
556          if (dom_node is not None) and recurse: 
557              from xml.dom import Node 
558              assert Node.ELEMENT_NODE == dom_node.nodeType 
559              for cn in dom_node.childNodes: 
560                  if Node.ELEMENT_NODE == cn.nodeType: 
561                      NamespaceContext(cn, self, True) 
 562   
563 -    def interpretQName (self, name, namespace=None): 
 564          """Convert the provided name into an L{ExpandedName}, i.e. a tuple of 
565          L{Namespace} and local name. 
566   
567          If the name includes a prefix, that prefix must map to an in-scope 
568          namespace in this context.  Absence of a prefix maps to 
569          L{defaultNamespace()}, which must be provided (or defaults to the 
570          target namespace, if that is absent). 
571           
572          @param name: A QName. 
573          @type name: C{str} or C{unicode} 
574          @param name: Optional namespace to use for unqualified names when 
575          there is no default namespace.  Note that a defined default namespace, 
576          even if absent, supersedes this value. 
577          @return: An L{ExpandedName} tuple: ( L{Namespace}, C{str} ) 
578          @raise pyxb.SchemaValidationError: The prefix is not in scope 
579          @raise pyxb.SchemaValidationError: No prefix is given and the default namespace is absent 
580          """ 
581          assert isinstance(name, (str, unicode)) 
582          if 0 <= name.find(':'): 
583              (prefix, local_name) = name.split(':', 1) 
584              assert self.inScopeNamespaces() is not None 
585              namespace = self.inScopeNamespaces().get(prefix) 
586              if namespace is None: 
587                  raise pyxb.SchemaValidationError('No namespace declared for QName %s prefix' % (name,)) 
588          else: 
589              local_name = name 
590               
591              if self.defaultNamespace() is not None: 
592                  namespace = self.defaultNamespace() 
593               
594               
595              if (namespace is None) and self.__fallbackToTargetNamespace: 
596                  namespace = self.targetNamespace() 
597              if namespace is None: 
598                  raise pyxb.SchemaValidationError('QName %s with absent default namespace cannot be resolved' % (local_name,)) 
599           
600           
601           
602          if (namespace != self.targetNamespace()): 
603              namespace.validateComponentModel() 
604          return pyxb.namespace.ExpandedName(namespace, local_name) 
 605   
606 -    def queueForResolution (self, component, depends_on=None): 
 607          """Forwards to L{queueForResolution()<Namespace.queueForResolution>} in L{targetNamespace()}.""" 
608          assert isinstance(component, _Resolvable_mixin) 
609          return self.targetNamespace().queueForResolution(component, depends_on) 
 610   
611   
612   
613   
614