| import functools
|
| import string
|
| import sys
|
| import typing as t
|
|
|
| if t.TYPE_CHECKING:
|
| import typing_extensions as te
|
|
|
| class HasHTML(te.Protocol):
|
| def __html__(self) -> str:
|
| pass
|
|
|
| _P = te.ParamSpec("_P")
|
|
|
|
|
| __version__ = "2.1.5"
|
|
|
|
|
| def _simple_escaping_wrapper(func: "t.Callable[_P, str]") -> "t.Callable[_P, Markup]":
|
| @functools.wraps(func)
|
| def wrapped(self: "Markup", *args: "_P.args", **kwargs: "_P.kwargs") -> "Markup":
|
| arg_list = _escape_argspec(list(args), enumerate(args), self.escape)
|
| _escape_argspec(kwargs, kwargs.items(), self.escape)
|
| return self.__class__(func(self, *arg_list, **kwargs))
|
|
|
| return wrapped
|
|
|
|
|
| class Markup(str):
|
| """A string that is ready to be safely inserted into an HTML or XML
|
| document, either because it was escaped or because it was marked
|
| safe.
|
|
|
| Passing an object to the constructor converts it to text and wraps
|
| it to mark it safe without escaping. To escape the text, use the
|
| :meth:`escape` class method instead.
|
|
|
| >>> Markup("Hello, <em>World</em>!")
|
| Markup('Hello, <em>World</em>!')
|
| >>> Markup(42)
|
| Markup('42')
|
| >>> Markup.escape("Hello, <em>World</em>!")
|
| Markup('Hello <em>World</em>!')
|
|
|
| This implements the ``__html__()`` interface that some frameworks
|
| use. Passing an object that implements ``__html__()`` will wrap the
|
| output of that method, marking it safe.
|
|
|
| >>> class Foo:
|
| ... def __html__(self):
|
| ... return '<a href="/foo">foo</a>'
|
| ...
|
| >>> Markup(Foo())
|
| Markup('<a href="/foo">foo</a>')
|
|
|
| This is a subclass of :class:`str`. It has the same methods, but
|
| escapes their arguments and returns a ``Markup`` instance.
|
|
|
| >>> Markup("<em>%s</em>") % ("foo & bar",)
|
| Markup('<em>foo & bar</em>')
|
| >>> Markup("<em>Hello</em> ") + "<foo>"
|
| Markup('<em>Hello</em> <foo>')
|
| """
|
|
|
| __slots__ = ()
|
|
|
| def __new__(
|
| cls, base: t.Any = "", encoding: t.Optional[str] = None, errors: str = "strict"
|
| ) -> "te.Self":
|
| if hasattr(base, "__html__"):
|
| base = base.__html__()
|
|
|
| if encoding is None:
|
| return super().__new__(cls, base)
|
|
|
| return super().__new__(cls, base, encoding, errors)
|
|
|
| def __html__(self) -> "te.Self":
|
| return self
|
|
|
| def __add__(self, other: t.Union[str, "HasHTML"]) -> "te.Self":
|
| if isinstance(other, str) or hasattr(other, "__html__"):
|
| return self.__class__(super().__add__(self.escape(other)))
|
|
|
| return NotImplemented
|
|
|
| def __radd__(self, other: t.Union[str, "HasHTML"]) -> "te.Self":
|
| if isinstance(other, str) or hasattr(other, "__html__"):
|
| return self.escape(other).__add__(self)
|
|
|
| return NotImplemented
|
|
|
| def __mul__(self, num: "te.SupportsIndex") -> "te.Self":
|
| if isinstance(num, int):
|
| return self.__class__(super().__mul__(num))
|
|
|
| return NotImplemented
|
|
|
| __rmul__ = __mul__
|
|
|
| def __mod__(self, arg: t.Any) -> "te.Self":
|
| if isinstance(arg, tuple):
|
|
|
| arg = tuple(_MarkupEscapeHelper(x, self.escape) for x in arg)
|
| elif hasattr(type(arg), "__getitem__") and not isinstance(arg, str):
|
|
|
| arg = _MarkupEscapeHelper(arg, self.escape)
|
| else:
|
|
|
| arg = (_MarkupEscapeHelper(arg, self.escape),)
|
|
|
| return self.__class__(super().__mod__(arg))
|
|
|
| def __repr__(self) -> str:
|
| return f"{self.__class__.__name__}({super().__repr__()})"
|
|
|
| def join(self, seq: t.Iterable[t.Union[str, "HasHTML"]]) -> "te.Self":
|
| return self.__class__(super().join(map(self.escape, seq)))
|
|
|
| join.__doc__ = str.join.__doc__
|
|
|
| def split(
|
| self, sep: t.Optional[str] = None, maxsplit: int = -1
|
| ) -> t.List["te.Self"]:
|
| return [self.__class__(v) for v in super().split(sep, maxsplit)]
|
|
|
| split.__doc__ = str.split.__doc__
|
|
|
| def rsplit(
|
| self, sep: t.Optional[str] = None, maxsplit: int = -1
|
| ) -> t.List["te.Self"]:
|
| return [self.__class__(v) for v in super().rsplit(sep, maxsplit)]
|
|
|
| rsplit.__doc__ = str.rsplit.__doc__
|
|
|
| def splitlines(
|
| self, keepends: bool = False
|
| ) -> t.List["te.Self"]:
|
| return [self.__class__(v) for v in super().splitlines(keepends)]
|
|
|
| splitlines.__doc__ = str.splitlines.__doc__
|
|
|
| def unescape(self) -> str:
|
| """Convert escaped markup back into a text string. This replaces
|
| HTML entities with the characters they represent.
|
|
|
| >>> Markup("Main » <em>About</em>").unescape()
|
| 'Main » <em>About</em>'
|
| """
|
| from html import unescape
|
|
|
| return unescape(str(self))
|
|
|
| def striptags(self) -> str:
|
| """:meth:`unescape` the markup, remove tags, and normalize
|
| whitespace to single spaces.
|
|
|
| >>> Markup("Main »\t<em>About</em>").striptags()
|
| 'Main » About'
|
| """
|
| value = str(self)
|
|
|
|
|
|
|
|
|
| while True:
|
|
|
| start = value.find("<!--")
|
|
|
| if start == -1:
|
| break
|
|
|
|
|
| end = value.find("-->", start)
|
|
|
| if end == -1:
|
| break
|
|
|
| value = f"{value[:start]}{value[end + 3:]}"
|
|
|
|
|
| while True:
|
| start = value.find("<")
|
|
|
| if start == -1:
|
| break
|
|
|
| end = value.find(">", start)
|
|
|
| if end == -1:
|
| break
|
|
|
| value = f"{value[:start]}{value[end + 1:]}"
|
|
|
|
|
| value = " ".join(value.split())
|
| return self.__class__(value).unescape()
|
|
|
| @classmethod
|
| def escape(cls, s: t.Any) -> "te.Self":
|
| """Escape a string. Calls :func:`escape` and ensures that for
|
| subclasses the correct type is returned.
|
| """
|
| rv = escape(s)
|
|
|
| if rv.__class__ is not cls:
|
| return cls(rv)
|
|
|
| return rv
|
|
|
| __getitem__ = _simple_escaping_wrapper(str.__getitem__)
|
| capitalize = _simple_escaping_wrapper(str.capitalize)
|
| title = _simple_escaping_wrapper(str.title)
|
| lower = _simple_escaping_wrapper(str.lower)
|
| upper = _simple_escaping_wrapper(str.upper)
|
| replace = _simple_escaping_wrapper(str.replace)
|
| ljust = _simple_escaping_wrapper(str.ljust)
|
| rjust = _simple_escaping_wrapper(str.rjust)
|
| lstrip = _simple_escaping_wrapper(str.lstrip)
|
| rstrip = _simple_escaping_wrapper(str.rstrip)
|
| center = _simple_escaping_wrapper(str.center)
|
| strip = _simple_escaping_wrapper(str.strip)
|
| translate = _simple_escaping_wrapper(str.translate)
|
| expandtabs = _simple_escaping_wrapper(str.expandtabs)
|
| swapcase = _simple_escaping_wrapper(str.swapcase)
|
| zfill = _simple_escaping_wrapper(str.zfill)
|
| casefold = _simple_escaping_wrapper(str.casefold)
|
|
|
| if sys.version_info >= (3, 9):
|
| removeprefix = _simple_escaping_wrapper(str.removeprefix)
|
| removesuffix = _simple_escaping_wrapper(str.removesuffix)
|
|
|
| def partition(self, sep: str) -> t.Tuple["te.Self", "te.Self", "te.Self"]:
|
| l, s, r = super().partition(self.escape(sep))
|
| cls = self.__class__
|
| return cls(l), cls(s), cls(r)
|
|
|
| def rpartition(self, sep: str) -> t.Tuple["te.Self", "te.Self", "te.Self"]:
|
| l, s, r = super().rpartition(self.escape(sep))
|
| cls = self.__class__
|
| return cls(l), cls(s), cls(r)
|
|
|
| def format(self, *args: t.Any, **kwargs: t.Any) -> "te.Self":
|
| formatter = EscapeFormatter(self.escape)
|
| return self.__class__(formatter.vformat(self, args, kwargs))
|
|
|
| def format_map(
|
| self, map: t.Mapping[str, t.Any]
|
| ) -> "te.Self":
|
| formatter = EscapeFormatter(self.escape)
|
| return self.__class__(formatter.vformat(self, (), map))
|
|
|
| def __html_format__(self, format_spec: str) -> "te.Self":
|
| if format_spec:
|
| raise ValueError("Unsupported format specification for Markup.")
|
|
|
| return self
|
|
|
|
|
| class EscapeFormatter(string.Formatter):
|
| __slots__ = ("escape",)
|
|
|
| def __init__(self, escape: t.Callable[[t.Any], Markup]) -> None:
|
| self.escape = escape
|
| super().__init__()
|
|
|
| def format_field(self, value: t.Any, format_spec: str) -> str:
|
| if hasattr(value, "__html_format__"):
|
| rv = value.__html_format__(format_spec)
|
| elif hasattr(value, "__html__"):
|
| if format_spec:
|
| raise ValueError(
|
| f"Format specifier {format_spec} given, but {type(value)} does not"
|
| " define __html_format__. A class that defines __html__ must define"
|
| " __html_format__ to work with format specifiers."
|
| )
|
| rv = value.__html__()
|
| else:
|
|
|
|
|
| rv = string.Formatter.format_field(self, value, str(format_spec))
|
| return str(self.escape(rv))
|
|
|
|
|
| _ListOrDict = t.TypeVar("_ListOrDict", list, dict)
|
|
|
|
|
| def _escape_argspec(
|
| obj: _ListOrDict, iterable: t.Iterable[t.Any], escape: t.Callable[[t.Any], Markup]
|
| ) -> _ListOrDict:
|
| """Helper for various string-wrapped functions."""
|
| for key, value in iterable:
|
| if isinstance(value, str) or hasattr(value, "__html__"):
|
| obj[key] = escape(value)
|
|
|
| return obj
|
|
|
|
|
| class _MarkupEscapeHelper:
|
| """Helper for :meth:`Markup.__mod__`."""
|
|
|
| __slots__ = ("obj", "escape")
|
|
|
| def __init__(self, obj: t.Any, escape: t.Callable[[t.Any], Markup]) -> None:
|
| self.obj = obj
|
| self.escape = escape
|
|
|
| def __getitem__(self, item: t.Any) -> "te.Self":
|
| return self.__class__(self.obj[item], self.escape)
|
|
|
| def __str__(self) -> str:
|
| return str(self.escape(self.obj))
|
|
|
| def __repr__(self) -> str:
|
| return str(self.escape(repr(self.obj)))
|
|
|
| def __int__(self) -> int:
|
| return int(self.obj)
|
|
|
| def __float__(self) -> float:
|
| return float(self.obj)
|
|
|
|
|
|
|
| try:
|
| from ._speedups import escape as escape
|
| from ._speedups import escape_silent as escape_silent
|
| from ._speedups import soft_str as soft_str
|
| except ImportError:
|
| from ._native import escape as escape
|
| from ._native import escape_silent as escape_silent
|
| from ._native import soft_str as soft_str
|
|
|