import abc import collections import html import io import re from codecs import open from sys import version_info from xml import sax from xml.dom import minidom as dom from xml.sax import SAXParseException from kajiki import ir, template from kajiki.doctype import DocumentTypeDeclaration, extract_dtd from kajiki.html_utils import HTML_CDATA_TAGS, HTML_OPTIONAL_END_TAGS, HTML_REQUIRED_END_TAGS from kajiki.markup_template import QDIRECTIVES, QDIRECTIVES_DICT impl = dom.getDOMImplementation(" ") def XMLTemplate( # noqa: N802 source=None, filename=None, mode=None, is_fragment=False, # noqa: FBT002 encoding="utf-8", autoblocks=None, cdata_scripts=True, # noqa: FBT002 strip_text=False, # noqa: FBT002 base_globals=None, ): """Given XML source code of a Kajiki Templates parses and returns a template class. The source code is parsed to its DOM representation by :class:`._Parser`, which is then expanded to separate directives from tags by :class:`._DomTransformer` and then compiled to the *Intermediate Representation* tree by :class:`._Compiler`. The *Intermediate Representation* generates the Python code which creates a new :class:`kajiki.template._Template` subclass through :meth:`kajiki.template.Template`. The generated code is then executed to return the newly created class. Calling ``.render()`` on an instance of the generate class will then render the template. """ if source is None: with open(filename, encoding=encoding) as f: source = f.read() # source is a unicode string if filename is None: filename = "" doc = _Parser(filename, source).parse() doc = _DomTransformer(doc, strip_text=strip_text).transform() ir_ = _Compiler( filename, doc, mode=mode, is_fragment=is_fragment, autoblocks=autoblocks, cdata_scripts=cdata_scripts, ).compile() return template.from_ir(ir_, base_globals=base_globals) def annotate(gen): def inner(self, node, *args, **kwargs): for x in gen(self, node, *args, **kwargs): self._anno(node, x) yield x return inner class _Compiler: """Compiles a DOM tree into IR :class:`kajiki.ir.TemplateNode`. Intermediate Representation is a tree of nodes that represent Python Code that should be generated to execute the template. """ def __init__( self, filename, doc, mode=None, is_fragment=False, # noqa: FBT002 autoblocks=None, cdata_scripts=True, # noqa: FBT002 ): self.filename = filename self.doc = doc self.is_fragment = is_fragment self.functions = collections.defaultdict(list) self.functions["__main__()"] = [] self.function_lnos = {} self.mod_py = [] self.autoblocks = autoblocks or [] self.cdata_scripts = cdata_scripts self.in_def = False self.is_child = False # The rendering mode is either specified in the *mode* argument, # or inferred from the DTD: self._dtd = DocumentTypeDeclaration.matching(self.doc._dtd) # noqa: SLF001 if mode: self.mode = mode elif self._dtd: self.mode = self._dtd.rendering_mode else: # The template might contain an unknown DTD self.mode = "xml" # by default def compile(self): """Compile the document provided by :class:`._Parser`. Returns as :class:`kajiki.ir.TemplateNode` instance representing the whole tree of nodes as their intermediate representation. The returned template will include at least a ``__main__`` function which is the document itself including a DOCTYPE and any function declared through ``py:def`` or as a ``py:block``. The ``TemplateNode`` will also include the module level code specified through ``" else: dtd = None if dtd: dtd = ir.TextNode(dtd.strip() + "\n") dtd.filename = self.filename dtd.lineno = 1 body.insert(0, dtd) self.functions["__main__()"] = body defs = [] for k, v in self.functions.items(): node = ir.DefNode(k, *v) node.lineno = self.function_lnos.get(k) defs.append(node) node = ir.TemplateNode(self.mod_py, defs) node.filename = self.filename node.lineno = 0 return node def _anno(self, dom_node, ir_node): if ir_node.lineno: return ir_node.filename = self.filename ir_node.lineno = dom_node.lineno def _is_autoblock(self, node): if node.tagName not in self.autoblocks: return False if node.hasAttribute("py:autoblock"): guard = node.getAttribute("py:autoblock").lower() if guard not in ("false", "true"): msg = "py:autoblock is evaluated at compile time " "and only accepts True/False constants" raise ValueError(msg) if guard == "false": # We throw away the attribute so it doesn't remain in rendered nodes. node.removeAttribute("py:autoblock") return False return True def _compile_node(self, node): """Convert a DOM node to its intermediate representation. Calls specific compile functions for special nodes and any directive that was expanded by :meth:`._DomTransformer._expand_directives`. For any plain XML node forward it to :meth:`._compile_xml`. Automatically converts any ``autoblock`` node to a ``py:block`` directive. """ if isinstance(node, dom.Comment): return self._compile_comment(node) if isinstance(node, dom.Text): return self._compile_text(node) if isinstance(node, dom.ProcessingInstruction): return self._compile_pi(node) if self._is_autoblock(node): # Set the name of the block equal to the tag itself. node.setAttribute("name", node.tagName) return self._compile_block(node) if node.tagName.startswith("py:"): # Handle directives compiler = getattr(self, "_compile_{}".format(node.tagName.split(":")[-1]), self._compile_xml) return compiler(node) return self._compile_xml(node) @annotate def _compile_xml(self, node): """Compile plain XML nodes. When compiling a node also take care of directives that only modify the node itself (``py:strip``, ``py:attrs`` and ``py:content``) as all directives wrapping the node and its children have already been handled by :meth:`._compile_node`. The provided intermediate representations include the node itself, its attributes and its content. Attributes of the node are handled through :class:`._TextCompiler` to ensure ${expr} expressions are handled in attributes too. In case the node has children (and no py:content) compile the children too. """ content = attrs = guard = None if node.hasAttribute("py:strip"): guard = node.getAttribute("py:strip") if guard == "": # py:strip="" means yes, do strip the tag # noqa: SIM108 guard = "False" else: guard = f"not ({guard})" node.removeAttribute("py:strip") yield ir.TextNode(f"<{node.tagName}", guard) for k, v in sorted(node.attributes.items()): tc = _TextCompiler( self.filename, v, node.lineno, ir.TextNode, in_html_attr=True, compiler_instance=self, ) v = list(tc) # noqa: PLW2901 if k == "py:content": content = node.getAttribute("py:content") continue elif k == "py:attrs": attrs = node.getAttribute("py:attrs") continue yield ir.AttrNode(k, v, guard, self.mode) if attrs: yield ir.AttrsNode(attrs, guard, self.mode) if content: yield ir.TextNode(">", guard) yield ir.ExprNode(content) yield ir.TextNode(f"", guard) elif node.childNodes: yield ir.TextNode(">", guard) if self.cdata_scripts and node.tagName in HTML_CDATA_TAGS: # Special behaviour for