Source code for mwparserfromhell.parser.tokens

# Copyright (C) 2012-2020 Ben Kurtovic <ben.kurtovic@gmail.com>
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

"""
This module contains the token definitions that are used as an intermediate
parsing data type - they are stored in a flat list, with each token being
identified by its type and optional attributes. The token list is generated in
a syntactically valid form by the :class:`.Tokenizer`, and then converted into
the :class`.Wikicode` tree by the :class:`.Builder`.
"""

__all__ = ["Token"]


[docs] class Token(dict): """A token stores the semantic meaning of a unit of wikicode.""" def __repr__(self): args = [] for key, value in self.items(): if isinstance(value, str) and len(value) > 100: args.append(key + "=" + repr(value[:97] + "...")) else: args.append(key + "=" + repr(value)) return "{}({})".format(type(self).__name__, ", ".join(args)) def __eq__(self, other): return isinstance(other, type(self)) and dict.__eq__(self, other) def __ne__(self, other): return not self.__eq__(other) def __getattr__(self, key): return self.get(key) def __setattr__(self, key, value): self[key] = value def __delattr__(self, key): del self[key]
def make(name): """Create a new Token class using ``type()`` and add it to ``__all__``.""" __all__.append(name) return type(name, (Token,), {}) Text = make("Text") TemplateOpen = make("TemplateOpen") # {{ TemplateParamSeparator = make("TemplateParamSeparator") # | TemplateParamEquals = make("TemplateParamEquals") # = TemplateClose = make("TemplateClose") # }} ArgumentOpen = make("ArgumentOpen") # {{{ ArgumentSeparator = make("ArgumentSeparator") # | ArgumentClose = make("ArgumentClose") # }}} WikilinkOpen = make("WikilinkOpen") # [[ WikilinkSeparator = make("WikilinkSeparator") # | WikilinkClose = make("WikilinkClose") # ]] ExternalLinkOpen = make("ExternalLinkOpen") # [ ExternalLinkSeparator = make("ExternalLinkSeparator") # ExternalLinkClose = make("ExternalLinkClose") # ] HTMLEntityStart = make("HTMLEntityStart") # & HTMLEntityNumeric = make("HTMLEntityNumeric") # # HTMLEntityHex = make("HTMLEntityHex") # x HTMLEntityEnd = make("HTMLEntityEnd") # ; HeadingStart = make("HeadingStart") # =... HeadingEnd = make("HeadingEnd") # =... CommentStart = make("CommentStart") # <!-- CommentEnd = make("CommentEnd") # --> TagOpenOpen = make("TagOpenOpen") # < TagAttrStart = make("TagAttrStart") TagAttrEquals = make("TagAttrEquals") # = TagAttrQuote = make("TagAttrQuote") # ", ' TagCloseOpen = make("TagCloseOpen") # > TagCloseSelfclose = make("TagCloseSelfclose") # /> TagOpenClose = make("TagOpenClose") # </ TagCloseClose = make("TagCloseClose") # > del make