alectryon/docutils.py

# Copyright © 2019 Clément Pit-Claudel
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

# pylint: disable=dangerous-default-value,unused-argument

"""reStructuredText support for Alectryon.

This file defines directives that format their contents using Alectryon.

These directives support various arguments to control the appearance of the
output; check out the README for details.

To use them, call ``docutils_support.register()`` before running your
reStructuredText to HTML converter.  The generated code relies on CSS classes
defined in the ``assets/alectryon.css`` file.

A checkbox and an accompanying label (with classes ``alectryon-toggle`` and
``alectryon-toggle-label``) allowing users to reveal all goals and responses at
once is automatically added right before the document's first paragraph.  You
can change its location by inserting an explicit ``.. alectryon-toggle::``
directive in your document, and you can omit it entirely by setting
``AlectryonTransform.auto_toggle`` to ``False`` (to make styling easier, all
contents following the checkbox are wrapped in a container with class
``alectryon-container``).

To replace Pygments' default highlighters with Alectryon's
everywhere, call ``alectryon.pygments.replace_builtin_lexer()``.

If you write lots of inline code snippets, consider calling ``set_default_role``,
which will set the default role to ``:coq:``.

For convenience, ``alectryon.docutils.setup()`` can be used to perform all the
steps above at once.

A note on transforms: Sphinx has a nice API (``app.add_node``) for adding new
node types, so you can write visitors for each output format without creating
new translators.  Docutils doesn't have such an API: it forces you to subclass
the default translator instead, which is a pain.  The alternative is to use a
transform to replace custom nodes with "raw" nodes, but even this is non-trivial
because the transform doesn't know which output format the document uses.

To work around this issue we use a writer-dependent transform on the docutils
side, and a doctree-resolved event on the Sphinx side.
"""

from typing import Any, ClassVar, DefaultDict, Dict, Iterable, List, Tuple, Type

import re
import os.path
from copy import deepcopy
from collections import namedtuple, defaultdict
from importlib import import_module

import docutils
import docutils.frontend
import docutils.transforms
import docutils.utils
import docutils.writers
from docutils import nodes

from docutils.parsers.rst import directives, roles, states, Directive # type: ignore
from docutils.parsers.rst.directives.body import Topic # type: ignore
from docutils.parsers.rst.directives.misc import Role # type: ignore
from docutils.readers.standalone import Reader as StandaloneReader
from docutils.transforms import Transform
from docutils.writers import html4css1, html5_polyglot, latex2e, xetex

from . import core, transforms, html, latex, markers
from .core import Gensym, Position, PosStr
from .pygments import make_highlighter, added_tokens, validate_style, \
    get_lexer, resolve_token, replace_builtin_lexers

# reST extensions
# ===============

def set_line(node, lineno, sm):
    """Record on `node` the source and line that `sm` reports for `lineno`.

    Both values come from a single ``sm.get_source_and_line(lineno)`` call.
    """
    source, line = sm.get_source_and_line(lineno)
    node.source = source
    node.line = line

# Nodes
# -----

class alectryon_pending(nodes.pending):
    """Placeholder for a prover snippet that has not been annotated yet.

    Created by ``ProverDirective.run``; ``AlectryonTransform.apply_drivers``
    looks these nodes up and replaces each one with an
    ``alectryon_pending_io`` node.
    """
    pass

class alectryon_pending_toggle(nodes.pending):
    """Placeholder marking where an explicit toggle checkbox was requested.

    Created by ``AlectryonToggleDirective.run`` and consumed by
    ``AlectryonTransform.apply_toggle``.
    """
    pass

class alectryon_pending_mref(nodes.pending):
    """Placeholder for a marker reference awaiting resolution.

    ``AlectryonMrefTransform`` replaces each of these with a reference or a
    pending quote, or removes it.  The code that creates these nodes is not in
    this part of the file.
    """
    pass

class alectryon_pending_io(nodes.pending):
    """Placeholder carrying annotated fragments that still need rendering.

    Created by ``AlectryonTransform.replace_node`` and rendered (or removed)
    by ``AlectryonPostTransform``.
    """
    pass

class alectryon_pending_quote(nodes.pending):
    """Placeholder for a quoted part of an annotated snippet.

    Created by ``AlectryonMrefTransform.format_one_quote`` and rendered by
    ``AlectryonPostTransform``.
    """
    pass

# Transforms
# ----------

# HTML template for the toggle checkbox and its label.  ``{id}`` is filled in
# by ``AlectryonTransform.apply_toggle``; newlines are stripped so that the
# snippet ends up on a single line.
TOGGLE_HTML = """
<input type="checkbox" class="alectryon-toggle" id="alectryon-toggle-{id}" />
<label for="alectryon-toggle-{id}" class="alectryon-toggle-label">
Display all goals and responses
</label>""".replace('\n', '')

LONG_LINE_THRESHOLD = 72
"""Threshold above which to warn about long lines."""

CACHE_DIRECTORY = None
"""Directory in which to store cached annotations."""

CACHE_COMPRESSION = None
"""Which compression to use for cache files.
See the documentation of --cache-compression."""

HTML_MINIFICATION = False
"""Whether to minify generated HTML files."""

def _node_error(document, node, msg):
    """Report `msg` as an error and replace `node` with a ``problematic`` node.

    The error message and the ``problematic`` node are cross-linked through
    their ids: the latter gets a ``refid`` to the former, which in turn gets a
    backref.
    """
    error = document.reporter.error(msg, base_node=node, line=node.line)
    raw = node.rawsource
    problematic = nodes.problematic(raw, raw, refid=document.set_id(error))
    error.add_backref(document.set_id(problematic))
    node.replace_self(problematic)

def _format_errors(src, *errs):
    """Format `errs` as a single ``In <src>:…`` message.

    A single error goes on the same line as the header; several errors are
    listed below it, indented.  When `src` is a docutils node, its ``text``
    attribute (or, failing that, its ``rawsource``) is used as the label.
    """
    joined = "\n".join(str(err) for err in errs)
    if len(errs) > 1:
        body = "\n" + core.indent(joined, "   ")
    else:
        body = " " + joined
    if isinstance(src, nodes.Node):
        src = getattr(src, "text", src.rawsource)
    return "In {}:{}".format(src, body)

def _try(document, fn, node, *args, **kwargs):
    """Call ``fn(node, *args, **kwargs)``, reporting failures on `node`.

    Returns the result of `fn` on success.  If `fn` raises
    ``transforms.CollectedErrors`` or ``ValueError``, `node` is replaced with
    an error marker in `document` and ``None`` is returned.
    """
    try:
        result = fn(node, *args, **kwargs)
    except transforms.CollectedErrors as e:
        errs = e.args
    except ValueError as e:
        errs = [e]
    else:
        return result
    _node_error(document, node, _format_errors(node, *errs))
    return None

# LATER: dataclass
class AlectryonState:
    """Alectryon bookkeeping attached to a single document."""

    def __init__(self, document):
        self.document = document
        self.drivers_info: List[core.DriverInfo] = []
        self.root_is_code: bool = False
        self.transforms_executed = set()
        self.embedded_assets = []
        self._config = None

    def populate_config(self):
        """Return the document's ``Config``, building it on first use."""
        # Lazy because `document` isn't initialized right away, but cached
        # because constructing a ``Config`` mutates the document.
        if not self._config:
            self._config = Config(self.document)
        return self._config

    @property
    def config(self):
        """The (lazily constructed) ``Config`` of this document."""
        return self.populate_config()

def alectryon_state(document):
    """Return the ``AlectryonState`` stored on `document`, creating it if needed."""
    existing = document.get("alectryon_state")
    if existing is not None:
        return existing
    fresh = AlectryonState(document)
    document["alectryon_state"] = fresh
    return fresh

def _sphinx_attr(document, attr):
    """Return attribute `attr` of ``document.settings.env``.

    If the settings have no ``env`` (or a falsy one), that falsy value is
    returned as is.
    """
    env = getattr(document.settings, "env", None)
    if not env:
        return env
    return getattr(env, attr)

def _sphinx_app(document):
    """Return the ``app`` attribute of `document`'s Sphinx environment, if any."""
    return _sphinx_attr(document, attr="app")

def _sphinx_config(document):
    """Return the ``config`` attribute of `document`'s Sphinx environment, if any."""
    return _sphinx_attr(document, attr="config")

def _docutils_config(document, attr, default=None):
    """Look up `attr` in Sphinx config, falling back to docutils settings.

    `default` is returned when neither of them defines `attr`.
    """
    fallback = getattr(document.settings, attr, default)
    return getattr(_sphinx_config(document), attr, fallback)

def _note_pending(document, node: nodes.pending):
    """Register the transform associated to a pending node.

    Nothing is registered for post-transforms when running under Sphinx.
    """
    if _sphinx_app(document) and node.transform.is_post_transform:
        return # Post-transforms are handled in sphinx.py
    document.note_pending(node)

def _gensym_stem(document, suffix=""):
    """Derive an id prefix from the base name of `document`'s source path.

    `suffix` is appended only when the document has a non-empty source.
    """
    source = document.get('source', "")
    stem = nodes.make_id(os.path.basename(source))
    return stem + (source and suffix)

class Config:
    """Per-document Alectryon settings.

    Defaults are copied from the class attributes of ``AlectryonTransform``,
    then overridden by the document's ``field_list`` / ``docinfo`` fields
    (``:alectryon/pygments/…:`` and ``:alectryon/serapi/args:``).

    Constructing a ``Config`` mutates the document: recognized fields are
    removed from it, and fields that fail to parse are replaced with error
    markers.
    """

    @staticmethod
    def _token_dict(): # Not a lambda because of pickling
        return defaultdict(list)

    def __init__(self, document):
        self.tokens_by_lang = defaultdict(self._token_dict)
        self.language_drivers = AlectryonTransform.LANGUAGE_DRIVERS.copy()
        self.driver_args: DefaultDict[str, List[str]] = defaultdict(list)
        for nm, args in AlectryonTransform.DRIVER_ARGS.items():
            self.driver_args[nm] = list(args)
        self.driver_args["sertop"].extend(AlectryonTransform.SERTOP_ARGS)
        self.document = document
        self.read_docinfo()

    def read_docinfo(self):
        """Apply every configuration field found in the document.

        A second pass then moves the error markers left by failed fields to
        just after their field list, and drops field lists that became empty.
        """
        # Sphinx doesn't translate ``field_list`` to ``docinfo``
        selector = lambda n: isinstance(n, (nodes.field_list, nodes.docinfo))
        for di in self.document.traverse(selector):
            for field in di.traverse(nodes.field):
                name, body = field.children
                # ``text`` is what ``_format_errors`` uses to label this field
                field.text = "`:{}:`".format(name.rawsource)
                field.rawsource = ":{}: {}".format(name.rawsource, body.rawsource)
                _try(self.document, self.parse_docinfo_field,
                     field, name.rawsource, body.rawsource)
        for di in self.document.traverse(selector):
            errors = []
            for field in di.traverse(nodes.problematic):
                errors.append(field)
                field.parent.remove(field)
            if errors:
                di.parent.insert(di.parent.index(di) + 1, errors)
            if not di.children:
                di.parent.remove(di)

    def parse_docinfo_field(self, node, name, body):
        """Interpret one field; remove `node` from the tree if it was ours.

        Fields whose name is not recognized are left untouched.  Problems
        raised as ``ValueError`` are turned into document errors by the
        ``_try`` wrapper that ``read_docinfo`` calls this through.
        """
        if name.startswith("alectryon/pygments/"):
            name = name[len("alectryon/pygments/"):]
            if "/" not in name:
                name = "coq/" + name # legacy syntax doesn't have coq/
                MSG = "Missing language name (did you mean `:alectryon/pygments/{}:`?)."
                msg = _format_errors(node, MSG.format(name))
                self.document.reporter.warning(msg, base_node=node, line=node.line)
            lang, token = name.split("/", maxsplit=1)
            resolve_token(token) # Check that this is a valid token
            # LATER: It would be nice to support multi-words tokens.  Using
            # ``shlex.split(body)`` instead of ``body.split()`` would work fine
            # here, but the filter added by ``added_tokens`` processes words
            # (“names”) one by one, so multi-word tokens would never match.
            self.tokens_by_lang[lang][token].extend(body.split())
        elif name == "alectryon/serapi/args":
            import shlex
            self.driver_args["sertop"].extend(self.parse_args(shlex.split(body)))
        else:
            return
        node.parent.remove(node)

    @staticmethod
    def parse_args(args):
        """Translate ``-I``/``-Q``/``-R`` style arguments for ``sertop``.

        This is a generator: for each occurrence of a flag in `args` it yields
        the short flag (``"-I"``, ``"-Q"`` or ``"-R"``) followed by that
        occurrence's values joined with commas.  Flags are grouped by letter
        (I, then Q, then R), not by their order in `args`.

        Raises ``ValueError`` when iteration starts if `args` is malformed.
        """
        import argparse

        class Parser(argparse.ArgumentParser):
            # The stock ``error`` prints usage and exits the process, which
            # would abort the whole build on a typo in a document field.
            # Raising ``ValueError`` lets ``_try`` report it on that field.
            def error(self, message):
                raise ValueError(message)

        p = Parser(prog=":alectryon/serapi/args:", add_help=False)
        p.add_argument("-I", "--ml-include-path", dest="I", metavar="DIR",
                       nargs=1, action="append", default=[])
        p.add_argument("-Q", "--load-path", dest="Q", metavar=("DIR", "COQDIR"),
                       nargs=2, action="append", default=[])
        p.add_argument("-R", "--rec-load-path", dest="R", metavar=("DIR", "COQDIR"),
                       nargs=2, action="append", default=[])
        parsed = vars(p.parse_args(args))
        for arg, instances in sorted(parsed.items()):
            for vals in instances:
                yield "-" + arg
                yield ",".join(vals)

    def get_driver_class_and_args(self, lang):
        """Return the driver class configured for `lang` and its arguments."""
        driver_name = self.language_drivers[lang]
        driver_cls = core.resolve_driver(lang, driver_name)
        driver_args = self.driver_args[driver_name]
        assert driver_name == driver_cls.ID
        return driver_cls, driver_args

    def init_driver(self, lang):
        """Instantiate the driver for `lang` on the document's source path."""
        cls, args = self.get_driver_class_and_args(lang)
        return cls(args, fpath=self.document['source'])

class OneTimeTransform(Transform):
    """Transform whose body (``_apply``) runs at most once per document.

    Executions are tracked by class name in the document's
    ``AlectryonState``.
    """
    is_post_transform = False

    def _apply(self):
        raise NotImplementedError()

    def _try(self, fn, node, *args, **kwargs):
        return _try(self.document, fn, node, *args, **kwargs)

    def apply(self, **_kwargs):
        # Transforms added by pending() nodes are added multiple times: once per
        # directive, and potentially once by add_transform in Sphinx, so we need
        # to make sure that running them twice is safe (in particular, we must
        # not overwrite the cache).
        key = type(self).__name__
        executed = alectryon_state(self.document).transforms_executed
        if key in executed:
            return
        executed.add(key)
        self._apply()

class LoadConfigTransform(OneTimeTransform):
    """Process ``field_list`` and ``docinfo`` configuration.

    This transform is not strictly necessary: a ``Config`` object will be
    initialized anyway when later code calls ``AlectryonState.config``.
    The point of this transform is to detect config issues at lint time.
    """
    default_priority = 300

    def _apply(self):
        state = alectryon_state(self.document)
        state.populate_config()

class ActivateMathJaxTransform(OneTimeTransform):
    """Add the ``mathjax_process`` class on math nodes.

    This is needed when another part of the pipeline adds mathjax_ignore on the
    root of the document to turn off MathJax's math-detection heuristics.
    """
    default_priority = 700

    @staticmethod
    def is_math(node):
        """Tell whether `node` is an inline or block math node."""
        math_types = (nodes.math, nodes.math_block)
        return isinstance(node, math_types)

    def _apply(self, **kwargs):
        for math_node in self.document.traverse(self.is_math):
            classes = math_node.attributes.setdefault("classes", [])
            classes.append("mathjax_process")

class DocutilsObserver(core.Observer):
    """Observer that forwards notifications to a document's reporter."""

    def __init__(self, document):
        self.document = document

    def _notify(self, n: core.Notification):
        # Position keywords are passed only when the notification carries a
        # location; the end position is optional on top of that.
        position = {}
        loc = n.location
        if loc:
            position["line"] = loc.beg.line
            position["column"] = loc.beg.col
            if loc.end:
                position["end_line"] = loc.end.line
                position["end_column"] = loc.end.col
        self.document.reporter.system_message(n.level, n.message, **position)

def by_lang(pending_nodes):
    """Group `pending_nodes` by their ``details["lang"]``.

    Returns a dict whose keys are in sorted order; within each group, nodes
    keep the order in which they were given.
    """
    groups = {}
    for node in pending_nodes:
        lang = node.details["lang"]
        if lang not in groups:
            groups[lang] = []
        groups[lang].append(node)
    return {lang: groups[lang] for lang in sorted(groups)}

class AlectryonTransform(OneTimeTransform):
    """Annotate pending prover snippets and insert the toggle checkbox.

    ``_apply`` first runs the drivers over all ``alectryon_pending`` nodes
    (replacing each with an ``alectryon_pending_io`` node), then handles the
    toggle checkbox.
    """
    default_priority = 800
    auto_toggle = True

    SERTOP_ARGS = ()
    """DEPRECATED; use DRIVER_ARGS["sertop"] instead."""

    # Class-level defaults; ``Config.__init__`` copies them for each document.
    LANGUAGE_DRIVERS: Dict[str, str] = core.DEFAULT_DRIVERS
    DRIVER_ARGS: Dict[str, Iterable[str]] = {d: () for d in core.ALL_DRIVERS}

    def check_for_long_lines(self, node, fragments):
        """Warn about each line of `fragments` longer than ``LONG_LINE_THRESHOLD``.

        Does nothing when the threshold is ``None``.
        """
        if LONG_LINE_THRESHOLD is None:
            return
        for linum, s in transforms.find_long_lines(fragments, threshold=LONG_LINE_THRESHOLD):
            msg = "Long line ({} characters)\n   {}".format(len(s), s)
            # NOTE(review): this reads ``contents_line`` as a node attribute,
            # whereas ``ProverDirective.run`` stores it under
            # ``details["contents_line"]`` — confirm which one is intended.
            contents_line = getattr(node, "contents_line", None)
            opts = dict(line=contents_line + linum) if contents_line else {}
            w = self.document.reporter.warning(msg, base_node=node, **opts)
            # We want a message on the command line but not in the document, so
            # remove the node created by ``Reporter.system_message``:
            self.document.transform_messages.remove(w)

    def annotate(self, pending_nodes, lang, cache):
        """Run the driver for `lang` over the contents of `pending_nodes`.

        Returns ``(cache.driver_info, annotated)``, where `annotated` is what
        ``cache.update`` returned for the list of contents.
        """
        driver = alectryon_state(self.document).config.init_driver(lang)
        driver.observer = DocutilsObserver(self.document)
        chunks = [pending.details["contents"] for pending in pending_nodes]
        annotated = cache.update(chunks, driver)
        return cache.driver_info, annotated

    def replace_node(self, pending, fragments, lang):
        """Replace `pending` with an ``alectryon_pending_io`` node.

        The new node carries the details of `pending` plus the transformed
        `fragments`, and is set up to be handled by ``AlectryonPostTransform``.
        """
        directive_annots = pending.details["directive_annots"]

        fragments = transforms.inherit_io_annots(fragments, directive_annots)
        fragments = transforms.default_transform(fragments, lang=lang, delay_errors=True)
        self.check_for_long_lines(pending, fragments)

        details = {**pending.details, "fragments": fragments}
        io = alectryon_pending_io(AlectryonPostTransform, details)
        _note_pending(self.document, io)
        pending.replace_self(io)

    def apply_drivers(self):
        """Annotate all pending snippets, one language at a time.

        Each language's driver info is appended to the document state.
        """
        from .json import CacheSet
        state = alectryon_state(self.document)
        all_pending = self.document.traverse(alectryon_pending)
        with CacheSet(CACHE_DIRECTORY, self.document['source'], CACHE_COMPRESSION) as caches:
            for lang, pending_nodes in by_lang(all_pending).items():
                driver_info, annotated = self.annotate(pending_nodes, lang, caches[lang])
                state.drivers_info.append(driver_info)
                for node, fragments in zip(pending_nodes, annotated):
                    # Errors are reported on the node that caused them
                    self._try(self.replace_node, node, fragments, lang)

    @staticmethod
    def split_around(node):
        """Return ``(siblings before node, node, siblings after node)``."""
        parent = node.parent
        idx = node.parent.index(node)
        return parent.children[:idx], node, parent.children[idx + 1:]

    @staticmethod
    def insert_toggle_after(node, toggle, keep_node):
        """Insert `toggle` at the position of `node` among its siblings.

        The parent's children become: the siblings that preceded `node`,
        `node` itself if `keep_node`, `toggle`, and finally a single container
        with class ``alectryon-container`` wrapping all following siblings.
        """
        pre, node, post = AlectryonTransform.split_around(node)
        if keep_node:
            pre.append(node)
        pre.append(toggle)
        pre.append(nodes.container('', *post, classes=['alectryon-container']))
        node.parent.children = pre

    def apply_toggle(self):
        """Insert toggle checkboxes into the document.

        Each explicit toggle placeholder is replaced with a checkbox, which
        also turns ``auto_toggle`` off on this instance.  If ``auto_toggle``
        is still set afterwards, one checkbox is inserted after the node found
        by ``next_node(nodes.docinfo)``, provided there is one.
        """
        toggle = lambda id: nodes.raw('', TOGGLE_HTML.format(id=id), format='html')
        toggles = list(self.document.traverse(alectryon_pending_toggle))
        for idx, node in enumerate(toggles):
            self.insert_toggle_after(node, toggle(idx), False)
            self.auto_toggle = False
        if self.auto_toggle:
            di = self.document.next_node(nodes.docinfo)
            if di:
                self.insert_toggle_after(di, toggle(0), True)

    def _apply(self):
        self.apply_drivers()
        self.apply_toggle()

class CounterStyle(namedtuple("CounterStyle", "start digits")):
    """A way to render counter values using a fixed tuple of `digits`.

    `start` is an offset added to the number being formatted.
    """

    def fmt(self, num):
        """Render `num` in this style; implemented by subclasses."""
        raise NotImplementedError

    @staticmethod
    def of_str(style):
        """Parse a whitespace-separated list of digits into a counter style.

        A leading ``_`` selects an ``Alphabetic`` style built from the
        remaining digits; otherwise all digits make up a ``Numeric`` style.
        Raises ``ValueError`` if `style` has fewer than two words.
        """
        symbols = tuple(style.split())
        if len(symbols) < 2:
            raise ValueError("Invalid counter style: {}".format(style))
        if symbols[0] != "_":
            return Numeric(1, symbols)
        return Alphabetic(0, symbols[1:])

class Alphabetic(CounterStyle):
    """Counter style without a zero digit (like a, b, …, z, aa, ab, …)."""

    def fmt(self, num):
        base = len(self.digits)
        remaining = num + 1 + self.start
        picked = []
        while remaining:
            remaining, idx = divmod(remaining - 1, base)
            picked.append(self.digits[idx])
        return "".join(reversed(picked))

class Numeric(CounterStyle):
    """Positional counter style whose first digit stands for zero."""

    def fmt(self, num):
        base = len(self.digits)
        remaining = num + self.start
        picked = []
        while remaining:
            remaining, idx = divmod(remaining, base)
            picked.append(self.digits[idx])
        return "".join(reversed(picked)) or self.digits[0]

class RefCounter:
    """Keeps one running counter per counter style."""

    def __init__(self):
        # Counters start at -1 so that the first value handed out is 0
        self.counters = defaultdict(lambda: -1)

    def next(self, style):
        """Advance the counter of `style` and return it formatted by `style`."""
        current = self.counters[style] + 1
        self.counters[style] = current
        return style.fmt(current)

class AlectryonMrefTransform(OneTimeTransform):
    """Resolve marker references into Alectryon input/output blocks.

    This transform is triggered by a ``pending`` node added by
    the ``:mref:`` role.  Each ``alectryon_pending_mref`` node is resolved
    against an ``alectryon_pending_io`` node and then replaced with a
    reference or a pending quote, or removed, depending on its ``kind``.
    """
    default_priority = 810

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.refcounter = RefCounter()
        self.gensym = Gensym(_gensym_stem(self.document, "-"))

    @classmethod
    def _validate_target(cls, target):
        """Raise ``ValueError`` if `target` is falsy."""
        if not target:
            raise ValueError("Target is null")

    @staticmethod
    def _find_mref_io(path, ios, last_io):
        """Pick the io node that `path` refers to.

        Uses ``ios[path["io"]]`` when a block name is given, and `last_io`
        otherwise.  Raises ``ValueError`` if no node is found.
        """
        io_name = path["io"]
        io = ios.get(io_name) if io_name else last_io
        if io is None:
            if io_name:
                raise ValueError("Reference to unknown Alectryon block.")
            raise ValueError("Not sure which code block this refers to; "
                             "add ``.io#…`` to disambiguate.")
        return io

    @classmethod
    def _find_mref_target(cls, path, io):
        """Return the part of `io`'s fragments selected by `path`.

        `path` always selects a sentence (key ``s``).  Further keys narrow the
        selection down to a message (``msg``), to a goal (``g``), or to parts
        of a goal (``ccl``, ``h``, ``name``) or of a hypothesis (``type``,
        ``body``, ``name``).
        """
        fragments = io.details["fragments"]
        # LATER: Add a way to name sentences to make them easier to select
        sentences = (fr for fr in fragments if isinstance(fr, core.RichSentence))
        sentence = markers.find_one("sentence", markers.find_sentences, sentences, path["s"])

        if "in" in path:
            return sentence
        if "msg" in path:
            msgs = list(transforms.fragment_messages(sentence))
            return markers.find_one("message", markers.find_contents, msgs, path["msg"])
        if "g" in path:
            goals = list(transforms.fragment_goals(sentence))
            goal = markers.find_one("goal", markers.find_goals, goals, path["g"])
            if "ccl" in path:
                return goal.conclusion
            if "h" in path:
                hyps = goal.hypotheses
                hyp = markers.find_one("hypothesis", markers.find_hyps, hyps, path["h"])
                # Unfold to ensure visibility (but only if search succeeded)
                if sentence.annots.unfold is None:
                    sentence.annots.unfold = True
                goal.props.setdefault("unfold", True)
                if "type" in path:
                    return hyp.type
                if "body" in path:
                    return hyp.body
                if "name" in path:
                    return hyp.names
                return hyp
            if "name" in path:
                return goal.name
            return goal

        return sentence

    def format_one_ref(self, target, node):
        """Build a ``reference`` node pointing to `target`.

        `target` is given a fresh id and a marker if it has none yet; the
        marker is the explicit title of `node` if there is one, and the next
        counter value otherwise.  The reference uses the last id and the last
        marker of `target`.
        """
        if not target.ids:
            target_id = nodes.make_id(node.details["target"])
            target.ids.append(self.gensym(target_id + "-")) # “-” avoids collisions
        if not target.markers:
            style = node.details["counter-style"]
            target.markers.append(node.details["title"] or self.refcounter.next(style))
        marker, refid = target.markers[-1], target.ids[-1]
        return nodes.reference(node.rawsource, marker,
                               classes=["alectryon-mref"], refid=refid)

    def format_one_quote(self, io, target, node):
        """Build an ``alectryon_pending_quote`` node for `target`.

        When `target` is a whole sentence, only its input is quoted.
        """
        if isinstance(target, core.RichSentence):
            target = target.input
        details = {**node.details, "lang": io.details["lang"], "target": target}
        node = alectryon_pending_quote(AlectryonPostTransform, details, node.rawsource)
        _note_pending(self.document, node)
        return node

    def replace_one_mref(self, node, ios, last_io):
        """Resolve `node` and replace it according to its ``kind``.

        ``ref`` yields a reference and ``quote`` a pending quote; ``assert``
        only checks that the target exists, after which `node` is removed.
        """
        kind, path = node.details["kind"], node.details["path"]
        io = self._find_mref_io(path, ios, last_io)
        target = self._find_mref_target(path, io)
        self._validate_target(target)

        if kind == "ref":
            repl = self.format_one_ref(target, node)
        elif kind == "quote":
            repl = self.format_one_quote(io, target, node)
        elif kind == "assert":
            repl = None
        else:
            assert False

        if repl:
            node.replace_self(repl)
        else:
            node.parent.remove(node)

    def _apply(self, **_kwargs):
        # Named lookup: every id of every io node maps to that node
        ios = {id: node
               for node in self.document.traverse(alectryon_pending_io)
               for id in node.get("ids", ())}
        # References that do not name a block resolve to the most recent io
        # node encountered so far in this traversal.
        last_io = None
        io_or_mref = lambda n: isinstance(n, (alectryon_pending_io, alectryon_pending_mref))
        for node in self.document.traverse(io_or_mref):
            if isinstance(node, alectryon_pending_io):
                last_io = node
            elif isinstance(node, alectryon_pending_mref):
                self._try(self.replace_one_mref, node, ios, last_io)

class AlectryonPostTransform(OneTimeTransform):
    """Convert Alectryon input/output pairs into HTML or LaTeX.

    This transform is triggered by a ``pending`` node added by
    ``AlectryonTransform``.  See ``docutils.components.transforms.Filter``.
    """
    default_priority = 820
    is_post_transform = True

    def _formats(self):
        """Return the collection in which the output format is looked up.

        This is ``app.tags`` under Sphinx, and the writer's ``supported``
        formats otherwise.
        """
        app = _sphinx_app(self.document)
        if app:
            # https://github.com/sphinx-doc/sphinx/issues/9632: Sphinx sets
            # ``document.transformer`` to ``None`` when reading from cache and
            # ``transformer.components`` to ``[]`` when writing, so we can't use
            # the writer's list of supported formats when compiling with Sphinx.
            return app.tags
        return self.document.transformer.components['writer'].supported

    def init_generator(self):
        """Return ``(format name, generator)`` for the current output format.

        HTML takes precedence over LaTeX when both are available.  Raises
        ``NotImplementedError`` for any other output format.
        """
        formats = set(self._formats())
        style = _docutils_config(self.document, "pygments_style")
        if 'html' in formats:
            highlighter = make_highlighter("html", None, style)
            return "html", html.HtmlGenerator(
                highlighter, _gensym_stem(self.document), HTML_MINIFICATION)
        if {'latex', 'xelatex', 'lualatex'} & formats:
            highlighter = make_highlighter("latex", None, style)
            return "latex", latex.LatexGenerator(highlighter)
        raise NotImplementedError("Unknown output format")

    @staticmethod
    def replace_one(node, fmt, rawtext, gen, *args, **kwargs):
        """Replace `node` with a ``raw`` node holding the output of `gen`.

        `gen` is called with `args` and `kwargs` plus the ids and classes of
        `node`.
        """
        ids = node.attributes.get("ids", ())
        classes = node.attributes.pop("classes", ()) # visit_raw adds a <div> if it finds classes
        dom = gen(*args, ids=ids, classes=classes, **kwargs)
        node.replace_self(nodes.raw(rawtext, dom.render(pretty=False), format=fmt))

    @classmethod
    def replace_one_io(cls, node, fmt, generator):
        """Render the fragments of `node`, or drop it if they are all hidden."""
        fragments, contents = node.details["fragments"], node.details["contents"]
        if transforms.all_hidden(fragments, node.details["directive_annots"]):
            node.parent.remove(node) # Remove ``.. coq:: none`` blocks
        else:
            cls.replace_one(node, fmt, contents, generator.gen_fragments, fragments)

    @classmethod
    def replace_one_quote(cls, node, fmt, generator):
        """Render the quoted target of `node`.

        Rendering works on a deep copy of the target, from which ids and
        props have been stripped.
        """
        target = deepcopy(node.details["target"])
        # LATER don't strip markers when block-quoting a full goal or hypothesis
        target = transforms.strip_ids_and_props(target, {"enabled", "markers"})
        with generator.highlighter.override(lang=node.details["language"]):
            cls.replace_one(node, fmt, node.details["path"], generator.gen_part,
                            target, inline=node.details["inline"])

    @classmethod
    def replace_io_or_quote(cls, node, fmt, generator):
        """Dispatch to ``replace_one_io`` or ``replace_one_quote``."""
        if isinstance(node, alectryon_pending_io):
            cls.replace_one_io(node, fmt, generator)
        elif isinstance(node, alectryon_pending_quote):
            cls.replace_one_quote(node, fmt, generator)
        else:
            assert False

    def _apply(self, **_kwargs):
        io_or_quote = lambda n: isinstance(n, (alectryon_pending_io, alectryon_pending_quote))
        all_pending = self.document.traverse(io_or_quote)
        fmt, generator = self.init_generator() # Init once so gensym is shared
        # Nodes are rendered language by language, with that language's
        # highlighter settings and custom tokens in effect.
        for lang, pending_nodes in by_lang(all_pending).items():
            config = alectryon_state(self.document).config
            with generator.highlighter.override(lang=lang):
                with added_tokens(config.tokens_by_lang[lang], lang):
                    for node in pending_nodes:
                        self.replace_io_or_quote(node, fmt, generator)

# Directives
# ----------

INDENTATION_RE = re.compile(r"^ *(?=[^\s])")
def measure_indentation(line):
    """Count the spaces that precede the first non-blank character of `line`.

    Returns ``None`` when the leading spaces are not directly followed by a
    non-whitespace character (e.g. for empty or blank lines).
    """
    found = INDENTATION_RE.match(line)
    if not found:
        return None
    return len(found.group(0))

def measure_min_indentation(lines):
    """Return the smallest indentation among `lines`.

    Lines for which ``measure_indentation`` returns ``None`` are ignored; the
    result is 0 when no line is left.
    """
    smallest = None
    for line in lines:
        width = measure_indentation(line)
        if width is None:
            continue
        if smallest is None or width < smallest:
            smallest = width
    return 0 if smallest is None else smallest

def recompute_contents(directive, real_indentation):
    """Compute the contents of `directive` relative to `real_indentation`.

    The reST parser automatically gobbles the indentation of a directive's
    body.  This function undoes that, which matters when a fragment is split
    across multiple code blocks: with automatic gobbling every block would be
    flushed left.  For example, reST renders the following with all lines
    flushed left::

        .. code::

           int main() {

        .. code::

               return 0;

        .. code::

           }

    With alternative input languages like reCommonMark or MyST there's no
    guarantee that the contents are indented by at least three spaces, so the
    minimum indentation of the body is measured and respected as well.

    Returns a pair ``(body_indentation, contents)``.
    """
    if directive.content_offset <= directive.lineno: # MyST bug
        return (0, "\n".join(directive.content))
    header_indentation = measure_indentation(directive.block_text)
    assert header_indentation is not None
    header_len = directive.content_offset - directive.lineno + 1
    body_lines = directive.block_text.splitlines()[header_len:]
    expected_indentation = header_indentation + real_indentation
    body_indentation = min(expected_indentation,
                           measure_min_indentation(body_lines))
    unindented = [ln[body_indentation:] for ln in body_lines]
    return body_indentation, "\n".join(unindented)

class AlectryonDirective(Directive): # pylint: disable=abstract-method
    """Base class for directives, with helpers to report errors."""

    def _error(self, msg, line=None):
        """Return a one-element list holding an error message for this directive.

        The error quotes the directive's source text and is attached to
        `line`, which defaults to the line of the directive itself.
        """
        line = self.lineno if line is None else line
        msg = 'Error in "{}" directive:\n{}'.format(self.name, msg)
        literal = nodes.literal_block(self.block_text, self.block_text)
        # Pass the resolved ``line`` on, so that an explicit `line` argument
        # is honored rather than replaced with ``self.lineno``.
        err = self.state_machine.reporter.error(msg, literal, line=line)
        return [err]

    def _try(self, fn, *args, default=None):
        """Call ``fn(*args)`` and return ``(result, errors)``.

        If `fn` raises ``ValueError``, the result is `default` and `errors`
        holds the corresponding error message; otherwise `errors` is empty.
        """
        try:
            return fn(*args), []
        except ValueError as e:
            return default, self._error(str(e))

class ProverDirective(AlectryonDirective):
    """Highlight and annotate a code snippet."""
    required_arguments = 0
    optional_arguments = 1
    final_argument_whitespace = True
    option_spec = {'class': directives.class_option,
                   'name': directives.unchanged}
    has_content = True

    EXPECTED_INDENTATION = 3

    @property
    def header(self):
        """The first line of the directive's source, between backquotes."""
        first_line, _, _ = self.block_text.partition('\n')
        return "`{}`".format(first_line)

    def run(self):
        """Create a pending node that records this snippet for annotation.

        Returns the pending node, followed by any error produced while
        parsing the directive's arguments.
        """
        self.assert_has_content()
        document = self.state_machine.document

        annots, errors = self._try(
            transforms.read_all_io_flags, " ".join(self.arguments), False,
            default=transforms.IOAnnots())

        indent, text = recompute_contents(self, ProverDirective.EXPECTED_INDENTATION)
        source, contents_line = self.state_machine.get_source_and_line(self.content_offset + 1)

        # Columns are not offset for snippets that come from the root
        # document when that document is flagged as ``root_is_code``.
        in_root_code = (document.get('source', "") == source
                        and alectryon_state(document).root_is_code)
        col_offset = 0 if in_root_code else indent

        contents = PosStr(text, Position(source, contents_line, col_offset), indent)

        roles.set_classes(self.options)
        details = {"lang": self.name, "directive_annots": annots,
                   "contents": contents, "contents_line": contents_line}
        pending = alectryon_pending(AlectryonTransform, details=details,
                                    rawsource=self.header, **self.options)

        set_line(pending, self.lineno, self.state_machine)
        self.add_name(pending)
        _note_pending(document, pending)

        return [pending, *errors]

def DriverDirective(lang: str):
    """Create a ``ProverDirective`` subclass whose ``name`` is `lang`.

    The class itself is named after the capitalized language, e.g.
    ``CoqDirective`` for ``"coq"``.
    """
    class_name = lang.capitalize() + "Directive"
    return type(class_name, (ProverDirective,), dict(name=lang))

DRIVER_DIRECTIVES = list(map(DriverDirective, core.ALL_LANGUAGES))

class Lean3Directive(ProverDirective):
    """Highlight and annotate a Lean 3 snippet."""
    # ``ProverDirective.run`` records this name as the snippet's ``lang``.
    name = "lean3"

class Lean4Directive(ProverDirective):
    """Highlight and annotate a Lean 4 snippet."""
    # ``ProverDirective.run`` records this name as the snippet's ``lang``.
    name = "lean4"

class AlectryonToggleDirective(Directive):
    """Display a checkbox allowing readers to show all output at once."""
    name = "alectryon-toggle"

    required_arguments = 0
    optional_arguments = 0
    option_spec: Dict[str, Any] = {}
    has_content = False

    def run(self):
        """Return a placeholder node marking where the checkbox goes."""
        sm = self.state_machine
        placeholder = alectryon_pending_toggle(AlectryonTransform)
        set_line(placeholder, self.lineno, sm)
        _note_pending(sm.document, placeholder)
        return [placeholder]

# This is just a small example
class ExperimentalExerciseDirective(Topic, AlectryonDirective):
    """Introduce an exercise.

    Behaves like the ``topic`` directive, with two extra options:

    - ``:difficulty:`` (required): a non-negative integer, stored on the
      resulting node as ``node['difficulty']``;
    - ``:optional:`` (flag): stored on the node as a boolean in
      ``node['optional']``.

    The title of the topic is prefixed with ``"Exercise: "``.
    """
    name = "exercise"

    required_arguments = 1
    option_spec = {**Topic.option_spec,
                   "difficulty": directives.nonnegative_int,
                   "optional": directives.flag}

    def run(self):
        """Build the topic node, annotate it, and return it in a list.

        Returns the result of ``self._error(…)`` instead when ``:difficulty:``
        is not given.
        """
        [node] = super().run()
        difficulty = self.options.get('difficulty')
        node['difficulty'] = difficulty
        # ``directives.flag`` converts a flag that is present to ``None``, so
        # presence has to be tested with ``in`` rather than read with ``get``.
        node['optional'] = 'optional' in self.options
        # Compare against ``None``: ``0`` is a valid non-negative difficulty.
        if difficulty is None:
            return self._error("Missing required option ':difficulty:'")
        for title in node.traverse(nodes.title):
            title.children.insert(0, nodes.Text("Exercise: "))
        return [node]

def directive_without_arguments(directive):
    """Create a subclass of `directive` that takes no arguments and no content.

    The subclass is named ``Converted``; apart from the three overridden
    attributes it inherits everything from `directive`, including its options.
    """
    overrides = {
        "has_content": False,
        "required_arguments": 0,
        "optional_arguments": 0,
    }
    return type("Converted", (directive,), overrides)

# Derived from docutils.directives.misc.Role (public domain)
# LATER: Move to upstream
class DirectiveDirective(Directive): # pragma: no cover
    """Define an alias of a directive.

    The first content line is matched against ``Role.argument_pattern`` to
    extract the new directive name and the name of the base directive.  The
    remaining lines are parsed as options of the base directive; they become
    defaults of the alias, which individual uses of the alias can override.
    Unless a ``class`` option is given, the new name is used as the class.
    """

    name = "directive"
    has_content = True

    def run(self):
        """Register the alias; return the system messages produced on the way."""
        if self.content_offset > self.lineno or not self.content:
            raise self.error('"%s" directive requires arguments on the first '
                             'line.' % self.name)
        args = self.content[0]
        match = Role.argument_pattern.match(args)
        if not match or not match.group(3):
            raise self.error('"%s" directive arguments not valid role names: '
                             '"%s".' % (self.name, args))
        new_name, base_name = match.group(1), match.group(3)

        # Look up the directive being aliased
        base, messages = directives.directive(
            base_name, self.state_machine.language, self.state_machine.document)
        if base is None:
            error = self.state.reporter.error(
                'Unknown directive "%s".' % base_name,
                nodes.literal_block(self.block_text, self.block_text),
                line=self.lineno)
            return messages + [error]

        # Parse the rest of the block as options of the base directive, using
        # a variant of it that accepts neither arguments nor content.
        try:
            converted = directive_without_arguments(base)
            (_arguments, options, _content, _content_offset) = (
                self.state.parse_directive_block(
                self.content[1:], self.content_offset, converted,
                option_presets={}))
        except states.MarkupError as detail:
            error = self.state_machine.reporter.error(
                'Error in "%s" directive:\n%s.' % (self.name, detail),
                nodes.literal_block(self.block_text, self.block_text),
                line=self.lineno)
            return messages + [error]
        if 'class' not in options:
            try:
                options['class'] = directives.class_option(new_name)
            except ValueError as detail:
                error = self.state_machine.reporter.error(
                    'Invalid argument for "%s" directive:\n%s.'
                    % (self.name, detail), nodes.literal_block(
                    self.block_text, self.block_text), line=self.lineno)
                return messages + [error]

        # FIXME convert `base` if it's a function instead of a class
        class CustomDirective(base):
            def run(self):
                # Options given at the use site win over the alias's defaults
                self.options = {**options, **self.options} # pylint: disable=attribute-defined-outside-init
                return super().run()

        # FIXME this leaks across documents
        directives.register_directive(new_name, CustomDirective)
        return messages

# Roles
# -----

def alectryon_bubble(role, rawtext, text, lineno, inliner,
                     options: Dict[str, Any]={}, content=[]):
    """Role producing an inline node with class ``alectryon-bubble``.

    `text`, `options` and `content` are not used.
    """
    bubble = nodes.inline(rawtext, classes=['alectryon-bubble'])
    set_line(bubble, lineno, inliner.reporter)
    messages = []
    return [bubble], messages

alectryon_bubble.name = "alectryon-bubble" # type: ignore

def mk_code_role(lang):
    """Create a role that formats its text as inline code in language `lang`.

    The returned function has the usual docutils role signature and a ``name``
    attribute equal to `lang`.  It delegates to ``roles.code_role`` after
    forcing the ``language`` option to `lang` and adding the ``highlight``
    class.
    """
    def code_role(role, rawtext, text, lineno, inliner,
                  options: Dict[str, Any]={}, content=[]):
        options = {**options, "language": lang}
        roles.set_classes(options)
        # The copy above is shallow, so an existing "classes" list is still the
        # caller's object: build a new list instead of appending in place,
        # otherwise "highlight" accumulates across calls sharing that list.
        options["classes"] = [*options.get("classes", []), "highlight"]
        return roles.code_role(role, rawtext, text, lineno, inliner, options, content)
    code_role.name = lang
    return code_role

# Maps each language of ``core.ALL_LANGUAGES`` to its inline-code role.
CODE_ROLES = {lang: mk_code_role(lang) for lang in core.ALL_LANGUAGES}

# Splits role text of the form ``title <target>`` into its two named groups;
# the ``<target>`` suffix is optional, in which case ``target`` is ``None``.
COQ_ID_RE = re.compile(r"^(?P<title>.*?)(?:\s*<(?P<target>.*)>)?$")
# Pairs of (module-path prefix, URL template).  ``coq_id_role`` picks the first
# pair whose prefix matches and substitutes ``$modpath`` and ``$ident``.
COQ_IDENT_DB_URLS = [
    ("Coq", "https://coq.inria.fr/library/$modpath.html#$ident")
]

def _role_error(inliner, rawtext, msg, lineno):
    """Report `msg` as an error and return a role result flagging `rawtext`.

    The result has the ``(nodes, messages)`` shape that role functions return.
    """
    error = inliner.reporter.error(_format_errors(rawtext, msg), line=lineno)
    problematic = inliner.problematic(rawtext, rawtext, error)
    return [problematic], [error]

def _parse_ref(text):
    """Split role text of the form ``title <target>`` into ``(title, target)``.

    `target` is ``None`` when `text` has no ``<…>`` suffix.  Text that
    ``COQ_ID_RE`` cannot match at all (for instance because it contains a line
    break, which ``.`` does not match) is returned whole as the title, with a
    ``None`` target, instead of failing on a ``None`` match object.
    """
    mid = COQ_ID_RE.match(text)
    if mid is None:
        return text, None
    return mid.group("title"), mid.group("target")

def coq_id_role(role, rawtext, text, lineno, inliner,
                options: Dict[str, Any]={}, content=[]):
    """Role linking to the documentation of a Coq identifier.

    The role text is either ``target`` or ``title <target>``.  The target is
    split into a module path and an identifier at its last ``#`` or, failing
    that, at its last ``.``.  The URL template comes from the ``url`` option
    or, when there is none, from the first matching entry of
    ``COQ_IDENT_DB_URLS``.  Returns an error result when no template applies.
    """
    title, target = _parse_ref(text)

    implicit = target is None
    if implicit:
        target = title

    if "#" in target:
        modpath, ident = target.rsplit("#", 1)
        if implicit:
            # Convert `A#b` to `b` and `A#` to `A`
            title = ident or modpath
    elif "." in target:
        modpath, ident = target.rsplit(".", 1)
    else:
        modpath, ident = "", target

    # Options are set using the ‘.. role’ directive
    url = options.get('url', None)
    if url is None:
        if not modpath:
            return _role_error(
                inliner, rawtext,
                "{target!r} is not a fully-qualified name.".format(target=target),
                lineno)

        # Keep the templates of all matching prefixes; the first one wins
        candidates = [template for (prefix, template) in COQ_IDENT_DB_URLS
                      if prefix == modpath or modpath.startswith(prefix + ".")]
        if not candidates:
            MSG = ("Not sure where to find documentation for {target}.\n"
                   "Make sure that ‘{target}’ is fully qualified"
                   " and that Alectryon knows where to find it.\n"
                   "Known prefixes: {prefixes}\n"
                   "(Add prefixes to alectryon.docutils.COQ_IDENT_DB_URLS or"
                   " derive a new role from ‘coqid’ with a custom :url:).")
            prefixes = [prefix for (prefix, _) in COQ_IDENT_DB_URLS]
            return _role_error(
                inliner, rawtext,
                MSG.format(target=target, prefixes=prefixes), lineno)
        url = candidates[0]

    from string import Template
    uri = Template(url).safe_substitute(modpath=modpath, ident=ident)

    roles.set_classes(options)
    reference = nodes.reference(rawtext, title, refuri=uri, **options)
    set_line(reference, lineno, inliner.reporter)

    return [reference], []

coq_id_role.name = "coqid" # type: ignore
coq_id_role.options = {'url': directives.unchanged} # type: ignore

# Named counter styles accepted by ``_opt_mref_counter_style``; each value is a
# space-separated list of symbols handed to ``CounterStyle.of_str``.
# NOTE(review): the leading ``_`` of the alphabetic styles presumably stands in
# for a missing zero digit — confirm against ``CounterStyle``.
COUNTER_STYLES = {
    'decimal': '0 1 2 3 4 5 6 7 8 9',
    'lower-alpha': '_ a b c d e f g h i j k l m n o p q r s t u v w x y z',
    'upper-alpha': '_ A B C D E F G H I J K L M N O P Q R S T U V W X Y Z',
    'lower-greek': '_ α β γ δ ε ζ η θ ι κ λ μ ν ξ ο π ρ σ τ υ φ χ ψ ω',
    'upper-greek': '_ Α Β Γ Δ Ε Ζ Η Θ Ι Κ Λ Μ Ν Ξ Ο Π Ρ Σ Τ Υ Φ Χ Ψ Ω',
}
# Style used by ``_marker_ref`` when no ``counter-style`` option is given.
DEFAULT_COUNTER_STYLE = CounterStyle.of_str(COUNTER_STYLES['decimal'])

# Values accepted by ``_opt_mref_kind``.
MREF_KINDS = ['ref', 'quote']

def _parse_mref_target(kind, target, prefix):
    """Turn the target of a marker reference into a path.

    A target starting with ``#`` or ``.``, and any target of a ``quote``
    reference, is parsed with ``markers.parse_path``; any other target is
    taken as a plain sentence matcher.  The result is merged with `prefix`.

    Raises ``ValueError`` if the target is empty, if the merged path has no
    sentence component, if ``.name`` is used in a ``ref`` query, or if a
    ``quote`` reference points at something that cannot be quoted inline.
    """
    if not target:
        # E.g. ``title <>``: reject it explicitly so that callers, which catch
        # ValueError, report an error instead of crashing on ``target[0]``.
        raise ValueError("Missing target in marker reference.")

    if target.startswith(("#", ".")) or kind == "quote":
        path = markers.parse_path(target)
    else:
        path = {"s": markers.PlainMatcher(target), "str": ".s({})".format(target)}

    path = markers.merge_paths(prefix, path)
    path.setdefault("io", None)

    if "s" not in path:
        raise ValueError("Missing .s(…) sentence component in path.")
    if "ccl" in path or "h" in path:
        # Conclusions and hypotheses default to the goal named "1"
        path.setdefault("g", markers.NameMatcher("1"))
    if kind == "ref" and "name" in path:
        raise ValueError("``.name`` is not supported in ``:mref:`` queries.")

    leaf = markers.set_leaf(path)
    if kind == "quote" and leaf not in ("msg", "h", "in", "type", "body", "name", "ccl"):
        MSG = "Cannot quote a full {} (``.{}``) inline."
        raise ValueError(MSG.format(markers.FULL_NAMES[leaf], leaf))

    return path

def _marker_ref(rawtext, text, lineno, document, reporter, options):
    """Create the pending node for a marker reference.

    The entries ``kind``, ``prefix``, ``counter-style``, ``inline`` and
    ``language`` are removed from `options` (which is modified in place); what
    remains is passed on as attributes of the node.  Raises ``ValueError`` when
    a title is given for a kind other than ``ref``.
    """
    kind = options.pop("kind", "ref")

    title, target = _parse_ref(text)
    if target is None:
        # No ``<…>`` part: the whole text is the target and there is no title
        target, title = title, None

    if title and kind != "ref":
        raise ValueError(
            "Title syntax (``… <…>``) not supported with ``:m{}:``.".format(kind))

    prefix = options.pop("prefix", {})
    path = _parse_mref_target(kind, target, prefix)
    counter_style = options.pop("counter-style", None) or DEFAULT_COUNTER_STYLE
    details = {
        "title": title,
        "target": target,
        "path": path,
        "counter-style": counter_style,
        "kind": kind,
        "inline": options.pop("inline", True),
        "language": options.pop("language", "coq"),
    }

    roles.set_classes(options)
    pending = alectryon_pending_mref(AlectryonMrefTransform, details, rawtext, **options)
    set_line(pending, lineno, reporter)
    _note_pending(document, pending)
    return pending

def marker_ref_role(role, rawtext, text, lineno, inliner,
                    options: Dict[str, Any]={}, content=[]):
    """Role creating a marker reference; ``ValueError``s become role errors."""
    try:
        pending = _marker_ref(
            rawtext, text, lineno, inliner.document, inliner.reporter, options)
    except ValueError as e:
        return _role_error(inliner, rawtext, str(e), lineno)
    return [pending], []

def _opt_mref_counter_style(arg):
    """Convert a ``counter-style`` option value to a ``CounterStyle``.

    A value containing a space is used as is; any other value must name an
    entry of ``COUNTER_STYLES``.
    """
    if " " in arg:
        spec = arg
    else:
        spec = COUNTER_STYLES[directives.choice(arg, list(COUNTER_STYLES))]
    return CounterStyle.of_str(spec)

def _opt_mref_prefix(prefix):
    """Convert a ``prefix`` option value to a path with ``markers.parse_path``.

    Any ``ValueError`` is re-raised as a plain ``ValueError`` carrying the same
    message.
    """
    try:
        raw = directives.unchanged_required(prefix)
        return markers.parse_path(raw)
    except ValueError as e:
        raise ValueError(str(e)) from e

def _opt_mref_kind(arg):
    """Validate a ``kind`` option value against ``MREF_KINDS``."""
    allowed = list(MREF_KINDS)
    return directives.choice(arg, allowed)

# Name of the role and converters for the options it accepts.
marker_ref_role.name = "mref" # type: ignore
marker_ref_role.options = { # type: ignore
    'counter-style': _opt_mref_counter_style,
    'prefix': _opt_mref_prefix,
    'kind': _opt_mref_kind
}

def marker_quote_role(role, rawtext, text, lineno, inliner,
                      options: Dict[str, Any]={}, content=[]):
    """Same as ``marker_ref_role``, with the ``kind`` option forced to ``quote``."""
    quote_options = {**options}
    quote_options["kind"] = "quote"
    return marker_ref_role(
        role, rawtext, text, lineno, inliner, quote_options, content)

def _opt_mquote_lexer(arg):
    """Return `arg` if ``get_lexer(arg)`` is truthy, else that falsy result."""
    lexer = get_lexer(arg)
    return arg if lexer else lexer

# Name of the role and converters for the options it accepts.
marker_quote_role.name = "mquote" # type: ignore
marker_quote_role.options = { # type: ignore
    'prefix': _opt_mref_prefix,
    'language': _opt_mquote_lexer,
}

class MQuoteDirective(AlectryonDirective):
    """Directive counterpart of the ``mquote`` role.

    Takes the reference as its single argument, and accepts the options of the
    role plus ``class``.  The resulting reference is created with ``inline``
    set to ``False``.
    """
    has_content = False
    required_arguments = 1
    optional_arguments = 0
    final_argument_whitespace = True

    name = marker_quote_role.name # type: ignore
    option_spec = {**marker_quote_role.options, # type: ignore
                   'class': directives.class_option}

    def run(self):
        """Return the pending reference (if any) followed by any errors."""
        machine = self.state_machine
        # The raw text is the first line of the directive block
        rawtext = self.block_text.split('\n', 1)[0]
        options = {**self.options, "kind": "quote", "inline": False}
        node, errors = self._try(
            _marker_ref, rawtext, self.arguments[0], self.lineno,
            machine.document, machine, options)
        found = [node] if node else []
        return found + errors

class MAssertDirective(AlectryonDirective):
    """Directive creating one ``assert`` marker reference per content line.

    The optional argument is a path prefix shared by all lines; blank lines
    are ignored.
    """
    has_content = True
    required_arguments = 0
    optional_arguments = 1
    final_argument_whitespace = True

    name = "massert"
    option_spec: Dict[str, Any] = {}

    @staticmethod
    def _gen_ref(sm, linum, refstr, options):
        """Create the reference for one content line (``None`` if it is blank)."""
        stripped = refstr.strip()
        if not stripped:
            return None
        rawtext = "assertion `{}`".format(stripped)
        # ``_marker_ref`` consumes its options, so give it its own copy
        return _marker_ref(rawtext, stripped, linum, sm.document, sm, dict(options))

    def run(self):
        """Return the references and errors produced, in content order."""
        machine = self.state_machine
        prefix_src = self.arguments[0] if self.arguments else ""
        # The second component starts out as the errors of parsing the prefix
        prefix, results = self._try(markers.parse_path, prefix_src)
        options = {**self.options, "kind": "assert", "prefix": prefix}

        first_line = self.content_offset + 1
        for linum, refstr in enumerate(self.content, start=first_line):
            ref, errs = self._try(self._gen_ref, machine, linum, refstr, options)
            results.append(ref)
            results.extend(errs)

        return [result for result in results if result is not None]

# Error printer
# -------------

class JsErrorObserver:
    """Observer recording messages and writing them to a stream as JSON.

    Every message is kept in ``errors``.  Messages whose level is at least
    ``settings.report_level`` are also written to `stream`, one JSON object
    per line, unless `stream` is falsy.
    """

    def __init__(self, stream, settings):
        self.errors = []
        self.stream = stream
        self.report_level = settings.report_level

    @staticmethod
    def json_of_message(msg):
        """Build the JSON-serializable dictionary describing `msg`."""
        if msg.children:
            message = msg.children[0].astext()
        else:
            message = "Unknown error"
        level_name = docutils.utils.Reporter.levels[msg['level']] # type: ignore
        return {"level": level_name.lower(),
                "message": message,
                "source": msg['source'],
                "line": msg.get('line', 1),
                "column": msg.get('column'),
                "end_line": msg.get('end_line'),
                "end_column": msg.get('end_column')}

    def __call__(self, msg):
        import json
        self.errors.append(msg)
        if not self.stream or msg['level'] < self.report_level:
            return
        json.dump(self.json_of_message(msg), self.stream)
        self.stream.write('\n')

# Parser
# ------

class RSTLiterateParser(docutils.parsers.rst.Parser): # type: ignore
    """A wrapper around the reStructuredText parser for literate files.

    The input is source code in the language named by ``LANG``; it is
    converted to reStructuredText lines (each tagged with a line number taken
    from the conversion) before being handed to the regular state machine.
    """

    LANG = ""
    supported: ClassVar[Tuple[str, ...]] = ()
    config_section = 'Literate parser'
    config_section_dependencies: ClassVar[Tuple[str, ...]] = ('parsers',)

    @staticmethod
    def rst_lines(lang, code):
        """Yield ``(text, line number)`` pairs for the reST version of `code`.

        Lines that carry no number of their own reuse the number of the last
        numbered line (0 before the first one).
        """
        from .literate import code2rst_lines, Line
        current = 0
        for line in code2rst_lines(lang, code):
            if not isinstance(line, Line):
                assert isinstance(line, str)
                yield (line, current)
                continue
            yield (str(line), line.num)
            current = line.num

    @classmethod
    def input_lines(cls, lang, code, source):
        """Build the ``StringList`` that the state machine runs on."""
        from docutils.statemachine import StringList
        # Build two separate lists (not tuples); the input can be empty
        pairs = list(cls.rst_lines(lang, code))
        initlist = [text for (text, _) in pairs]
        items = [(source, num) for (_, num) in pairs]
        return StringList(initlist, source, items)

    def report_parsing_error(self, e):
        """Append a severe message describing `e` to the document."""
        message = self.document.reporter.severe(
            e.message, line=e.line, column=e.column,
            end_line=e.end_line, end_column=e.end_column)
        self.document.append(message)

    @property
    def lang(self):
        """The entry of ``literate.LANGUAGES`` for ``LANG``."""
        from .literate import LANGUAGES
        return LANGUAGES[self.LANG]

    def parse(self, inputstring, document):
        """Parse `inputstring` and populate `document`, a document tree."""
        from .literate import ParsingError
        self.setup_parse(inputstring, document)
        # pylint: disable=attribute-defined-outside-init
        alectryon_state(document).root_is_code = True
        machine = docutils.parsers.rst.states.RSTStateMachine( # type: ignore
            state_classes=self.state_classes,
            initial_state=self.initial_state,
            debug=document.reporter.debug_flag)
        self.statemachine = machine
        try:
            rst_input = self.input_lines(self.lang, inputstring, document['source'])
            self.statemachine.run(rst_input, document, inliner=self.inliner)
        except ParsingError as e:
            self.report_parsing_error(e)
        finally:
            roles._roles.pop('', None) # Reset the default role
        self.finish_parse()

class RSTCoqParser(RSTLiterateParser):
    """Literate parser for Coq sources."""
    # Key into ``literate.LANGUAGES`` (see ``RSTLiterateParser.lang``)
    LANG = "coq"
    supported = ("coq",)

class RSTLean3Parser(RSTLiterateParser):
    """Literate parser for Lean 3 sources."""
    # Key into ``literate.LANGUAGES`` (see ``RSTLiterateParser.lang``)
    LANG = "lean3"
    supported = ("lean3",)

class RSTLean4Parser(RSTLiterateParser):
    """Literate parser for Lean 4 sources."""
    # Key into ``literate.LANGUAGES`` (see ``RSTLiterateParser.lang``)
    LANG = "lean4"
    supported = ("lean4", "lean")

# Writer
# ------

def register_stylesheets(translator, stylesheets, assets_path):
    """Add each of `stylesheets` to ``translator.stylesheet``.

    Without ``embed_stylesheet``, assets are referenced by their relative
    name.  With it, every asset is recorded in the document's
    ``embedded_assets``; ``core.Asset`` instances are generated and inlined
    directly, and other assets are referenced through their path under
    `assets_path`.
    """
    for asset in stylesheets:
        if not translator.settings.embed_stylesheet:
            # Keep the name relative when not inlining
            translator.stylesheet.append(translator.stylesheet_call(asset))
            continue

        alectryon_state(translator.document).embedded_assets.append(asset)
        if isinstance(asset, core.Asset):
            # Inline by hand, since the file doesn't exist on disk
            contents = asset.gen(vars(translator.settings))
            translator.stylesheet.append(translator.embedded_stylesheet % contents)
        else:
            expanded = os.path.join(assets_path, asset)
            translator.stylesheet.append(translator.stylesheet_call(expanded))

def make_HtmlTranslator(base):
    """Derive an Alectryon-aware HTML translator class from `base`.

    The resulting translator registers Alectryon's stylesheets, scripts and
    additional ``<head>`` entries, wraps the body in a ``<div>`` carrying the
    webpage-style classes, and optionally adds the banner.
    """
    class Translator(base):
        JS = html.ASSETS.ALECTRYON_JS
        CSS = (*html.ASSETS.ALECTRYON_CSS,
               *html.ASSETS.DOCUTILS_CSS,
               *html.ASSETS.PYGMENTS_CSS)
        ADDITIONAL_HEADS = [html.ASSETS.IBM_PLEX_CDN,
                            html.ASSETS.FIRA_CODE_CDN,
                            *html.ADDITIONAL_HEADS]

        ASSETS = JS + CSS
        ASSETS_PATH = html.ASSETS.PATH

        JS_TEMPLATE = '<script type="text/javascript" src="{}"></script>\n'
        MATHJAX_URL = \
            'https://cdnjs.cloudflare.com/ajax/libs/mathjax/3.2.0/es5/tex-mml-chtml.min.js'
        mathjax_script = '<script type="text/javascript" defer src="%s"></script>\n'

        head_prefix_template = \
            '<html xmlns="http://www.w3.org/1999/xhtml" class="alectryon-standalone"' \
            ' xml:lang="%(lang)s" lang="%(lang)s">\n<head>\n'

        def __init__(self, document):
            # Must be set before the base translator reads the settings
            document.settings.math_output = "MathJax " + self.MATHJAX_URL
            super().__init__(document)

            classes = [self.settings.alectryon_webpage_style]
            register_stylesheets(self, self.CSS, self.ASSETS_PATH)
            self.stylesheet.extend(self.JS_TEMPLATE.format(js) for js in self.JS)
            self.stylesheet.extend(hd + "\n" for hd in self.ADDITIONAL_HEADS)
            if HTML_MINIFICATION:
                classes.append("minified")
                # ``append``, not ``extend``: extending a list with a string
                # adds it one character at a time.
                self.stylesheet.append(html.JS_UNMINIFY + "\n")

            cls = html.wrap_classes(*classes)
            self.body_prefix.append('<div class="{}">'.format(cls))

            if self.settings.alectryon_banner:
                drivers_info = alectryon_state(document).drivers_info
                include_vernums = document.settings.alectryon_vernums
                self.body_prefix.append(html.gen_banner(drivers_info, include_vernums))

            # Close the wrapper ``<div>`` opened in ``body_prefix``
            self.body_suffix.insert(0, '</div>')
    return Translator

HtmlTranslator = make_HtmlTranslator(html4css1.HTMLTranslator)
Html5Translator = make_HtmlTranslator(html5_polyglot.HTMLTranslator)

def opt_validate_style(setting, value, option_parser,
                       config_parser=None, config_section=None):
    """Settings validator delegating to ``validate_style``.

    Only `value` is used; the other parameters are ignored.
    """
    validated = validate_style(value)
    return validated

# WISH: Either remove these settings and expose global constants (like
# HTML_MINIFICATION), or add missing settings here.
# Each entry is (help text, option strings, keyword arguments); the tuple is
# used as the options part of a ``settings_spec`` group by ``make_HtmlWriter``.
ALECTRYON_SETTINGS: Tuple[Tuple[str, List[str], Dict[str, Any]], ...] = (
    ("Choose an Alectryon webpage style",
     ["--webpage-style"],
     {"choices": ("centered", "floating", "windowed"),
      "dest": "alectryon_webpage_style",
      "default": "centered", "metavar": "STYLE"}),
    ("Choose a Pygments style by name",
     ["--pygments-style"],
     {'default': None, 'dest': "pygments_style",
      'validator': opt_validate_style}),
    ("Omit Alectryon's explanatory header",
     ["--no-header"],
     {'default': True, 'action': 'store_false',
      'dest': "alectryon_banner",
      'validator': docutils.frontend.validate_boolean}),
    ("Omit Alectryon's version info",
     ["--no-version-numbers"],
     {'default': True, 'action': 'store_false',
      'dest': "alectryon_vernums",
      'validator': docutils.frontend.validate_boolean})
)

def make_HtmlWriter(base, translator):
    """Derive from `base` an HTML writer class that uses `translator`.

    The writer adds Alectryon's settings to those of `base` and overrides two
    of its defaults.
    """
    alectryon_spec = ('Alectryon HTML writer options', None, ALECTRYON_SETTINGS)

    class Writer(base):
        settings_spec = base.settings_spec + alectryon_spec

        settings_default_overrides = { # By default:
            # We embed the short-classes Pygments stylesheet, not the long-classes one…
            "syntax_highlight": "short",
            # … and we want to link to Alectryon's stylesheet, not embed it
            "embed_stylesheet": False,
        }

        def __init__(self, *args, **kwargs):
            super().__init__(*args, **kwargs)
            # Set after the base initializer has run
            self.translator_class = translator

    return Writer

HtmlWriter = make_HtmlWriter(html4css1.Writer, HtmlTranslator)
Html5Writer = make_HtmlWriter(html5_polyglot.Writer, Html5Translator)

def make_LatexTranslator(base):
    """Derive from `base` a LaTeX translator class that registers Alectryon's styles."""
    style_files = latex.ASSETS.ALECTRYON_STY + latex.ASSETS.PYGMENTS_STY

    class Translator(base):
        STY = style_files

        ASSETS = STY
        ASSETS_PATH = latex.ASSETS.PATH

        # Template used by ``register_stylesheets`` when inlining a style file
        embedded_stylesheet = "%% embedded stylesheet\n\\makeatletter\n%s\n\\makeatother\n"

        def __init__(self, document, *args, **kwargs):
            super().__init__(document, *args, **kwargs)
            register_stylesheets(self, self.STY, self.ASSETS_PATH)

    return Translator

LatexTranslator = make_LatexTranslator(latex2e.LaTeXTranslator)
XeLatexTranslator = make_LatexTranslator(xetex.XeLaTeXTranslator)
LuaLatexTranslator = make_LatexTranslator(xetex.XeLaTeXTranslator) # Same translator

def make_LatexWriter(base, translator_class):
    """Derive from `base` a LaTeX writer class that uses `translator_class`."""
    overrides = {
        # We want short-name Pygments macros; alectryon.sty then maps
        # \DUrole to \PY.
        "syntax_highlight": "short",
    }

    class Writer(base):
        settings_default_overrides = overrides

        def __init__(self, *args, **kwargs):
            super().__init__(*args, **kwargs)
            # Set after the base initializer has run
            self.translator_class = translator_class

    return Writer

LatexWriter = make_LatexWriter(latex2e.Writer, LatexTranslator)
XeLatexWriter = make_LatexWriter(xetex.Writer, XeLatexTranslator)
LuaLatexWriter = make_LatexWriter(xetex.Writer, LuaLatexTranslator) # Same writer

class DummyTranslator:
    """Translator placeholder for backends without assets (see ``BACKENDS``)."""
    # Same attribute names as the HTML and LaTeX translators, but empty
    ASSETS: List[str] = []
    ASSETS_PATH = ""

# Linter
# ======

class EarlyTransformer(docutils.transforms.Transformer):
    """A transformer that only applies transforms below a certain threshold."""
    PRIORITY_THRESHOLD = "700-000"

    def apply_transforms(self):
        """Drop the entries at or above the threshold, then apply the rest."""
        threshold = self.PRIORITY_THRESHOLD
        # The first component of each entry is compared with the threshold
        self.transforms = [entry for entry in self.transforms
                           if entry[0] < threshold]
        super().apply_transforms()

class LintingReader(StandaloneReader):
    """A reader that collects all messages as JSON instead of printing them.

    Accepts an extra keyword argument, ``error_stream``: the stream that JSON
    messages are written to (a fresh ``StringIO`` by default).
    """

    def __init__(self, *args, **kwargs):
        from io import StringIO
        # Take ``error_stream`` out of ``kwargs`` before calling the base
        # initializer, so that it is not forwarded to it.
        if "error_stream" in kwargs:
            error_stream = kwargs.pop("error_stream")
        else:
            error_stream = StringIO()
        super().__init__(*args, **kwargs)
        self.error_stream = error_stream

    def get_transforms(self):
        """Return the base reader's transforms plus ``LoadConfigTransform``."""
        return super().get_transforms() + [LoadConfigTransform]

    def new_document(self):
        """Create a document that reports every message to a ``JsErrorObserver``."""
        doc = super().new_document()
        doc.transformer = EarlyTransformer(doc)

        js_observer = JsErrorObserver(self.error_stream, self.settings)
        doc.reporter.report_level = 0 # Report all messages
        doc.reporter.halt_level = docutils.utils.Reporter.SEVERE_LEVEL + 1 # Do not exit early
        doc.reporter.stream = False # Disable textual reporting
        doc.reporter.attach_observer(js_observer)
        # Kept on the document so that ``LintingWriter`` can find it
        doc["js_observer"] = js_observer

        return doc

class LintingWriter(docutils.writers.UnfilteredWriter):
    """A writer whose output is the text accumulated by the JSON observer."""

    def translate(self):
        """Set ``self.output`` to the contents of the observer's stream."""
        observer = self.document["js_observer"]
        self.output = observer.stream.getvalue()

# API
# ===

# The four classes that ``get_pipeline`` selects for a frontend and a backend.
Pipeline = namedtuple("Pipeline", "reader parser translator writer")

# Frontend name → parser, given as a (module name, attribute name) pair that
# ``_maybe_import`` resolves on demand.
PARSERS = {
    "coq+rst": (__name__, "RSTCoqParser"),
    "lean3+rst": (__name__, "RSTLean3Parser"),
    "lean4+rst": (__name__, "RSTLean4Parser"),
    "rst": ("docutils.parsers.rst", "Parser"),
    "md": ("alectryon.myst", "Parser"),
}

# Backend name → dialect → (translator, writer).  Each component is either a
# class or a (module name, attribute name) pair for ``_maybe_import``.
BACKENDS = {
    'webpage': {
        'html4': (HtmlTranslator, HtmlWriter),
        'html5': (Html5Translator, Html5Writer),
    },
    'latex': {
        'pdflatex': (LatexTranslator, LatexWriter),
        'xelatex': (XeLatexTranslator, XeLatexWriter),
        'lualatex': (LuaLatexTranslator, LuaLatexWriter),
    },
    'lint': {
        None: (DummyTranslator, LintingWriter),
    },
    'pseudoxml': {
        None: (DummyTranslator, ("docutils.writers.pseudoxml", "Writer")),
    }
}

def _maybe_import(tp):
    return getattr(import_module(tp[0]), tp[1]) if isinstance(tp, tuple) else tp

def get_reader(_frontend, backend):
    """Return the reader class for `backend` (the frontend is not used)."""
    if backend == 'lint':
        return LintingReader
    return StandaloneReader

def get_parser(frontend):
    """Return the parser class for `frontend`.

    Raises ``ValueError`` if `frontend` is not a key of ``PARSERS``.
    """
    if frontend in PARSERS:
        return _maybe_import(PARSERS[frontend])
    raise ValueError("Unsupported docutils frontend: {}".format(frontend))

def get_writer(backend, dialect):
    """Return the ``(translator, writer)`` classes for `backend` and `dialect`.

    Raises ``ValueError`` if either is missing from ``BACKENDS``.
    """
    if backend not in BACKENDS:
        raise ValueError("Unsupported docutils backend: {}".format(backend))
    dialects = BACKENDS[backend]
    if dialect not in dialects:
        raise ValueError("Unsupported {} dialect: {}".format(backend, dialect))
    translator, writer = dialects[dialect]
    return _maybe_import(translator), _maybe_import(writer)

def get_pipeline(frontend, backend, dialect):
    """Assemble the ``Pipeline`` for `frontend`, `backend` and `dialect`."""
    reader = get_reader(frontend, backend)
    parser = get_parser(frontend)
    translator, writer = get_writer(backend, dialect)
    return Pipeline(reader=reader, parser=parser,
                    translator=translator, writer=writer)

# Entry points
# ============

# Node classes defined by this module.
NODES = [
    alectryon_pending,
    alectryon_pending_toggle,
    alectryon_pending_io
]
# Transforms defined by this module.
TRANSFORMS: List[Type[OneTimeTransform]] = [
    LoadConfigTransform,
    ActivateMathJaxTransform,
    AlectryonTransform,
    AlectryonMrefTransform,
    AlectryonPostTransform
]
# Directives that ``register()`` registers, each under its ``name`` attribute.
DIRECTIVES = [
    *DRIVER_DIRECTIVES,
    AlectryonToggleDirective,
    MQuoteDirective,
    MAssertDirective,
    ExperimentalExerciseDirective,
    DirectiveDirective
]
# Roles that ``register()`` registers, each under its ``name`` attribute.
ROLES = [
    *CODE_ROLES.values(),
    alectryon_bubble,
    coq_id_role,
    marker_ref_role,
    marker_quote_role
]

def register():
    """Tell Docutils about our roles and directives.

    Every entry of ``DIRECTIVES`` and ``ROLES`` is registered under its
    ``name`` attribute.
    """
    for directive_class in DIRECTIVES:
        directives.register_directive(directive_class.name, directive_class)
    for role_fn in ROLES:
        roles.register_canonical_role(role_fn.name, role_fn)

def set_default_role(lang="coq"):
    """Set the default role (the one used with single backticks) to :``lang``:.

    `lang` must be the name of one of the roles in ``ROLES``; otherwise a
    ``ValueError`` is raised.
    """
    for role in ROLES:
        if role.name == lang:
            # Install the role that was asked for, not unconditionally Coq's
            roles.DEFAULT_INTERPRETED_ROLE = role.name # type: ignore
            return
    raise ValueError("Unsupported language: {}".format(lang))

def setup(lang="coq"):
    """Prepare docutils for writing documents with Alectryon.

    This includes registering Alectryon's role and directives, loading an
    improved Coq highlighter, and setting the default role to ``:lang:``.

    Raises ``ValueError`` (from ``set_default_role``) if `lang` is not
    supported.
    """
    # Registration comes first, then the default role, then the lexers
    register()
    set_default_role(lang)
    replace_builtin_lexers()