# $Id: __init__.py 9956 2024-10-20 19:45:21Z milde $ # Author: David Goodger # Copyright: This module has been placed in the public domain. """ This package contains Docutils Writer modules. """ from __future__ import annotations __docformat__ = 'reStructuredText' import importlib from typing import TYPE_CHECKING import docutils from docutils import languages, Component from docutils.transforms import universal if TYPE_CHECKING: from typing import Any, Final from docutils import nodes from docutils.io import Output from docutils.languages import LanguageModule from docutils.transforms import Transform class Writer(Component): """ Abstract base class for docutils Writers. Each writer module or package must export a subclass also called 'Writer'. Each writer must support all standard node types listed in `docutils.nodes.node_class_names`. The `write()` method is the main entry point. """ component_type: Final = 'writer' config_section: Final = 'writers' def get_transforms(self) -> list[type[Transform]]: return super().get_transforms() + [universal.Messages, universal.FilterMessages, universal.StripClassesAndElements] document: nodes.document | None = None """The document to write (Docutils doctree); set by `write()`.""" output: str | bytes | None = None """Final translated form of `document` (`str` for text, `bytes` for binary formats); set by `translate()`. """ language: LanguageModule | None = None """Language module for the document; set by `write()`.""" destination: Output | None = None """`docutils.io` Output object; where to write the document. Set by `write()`. """ def __init__(self) -> None: self.parts: dict[str, Any] = {} """Mapping of document part names to fragments of `self.output`. See `Writer.assemble_parts()` below and . """ def write(self, document: nodes.document, destination: Output ) -> str | bytes | None: """ Process a document into its final form. Translate `document` (a Docutils document tree) into the Writer's native format, and write it out to its `destination` (a `docutils.io.Output` subclass object). Normally not overridden or extended in subclasses. """ self.document = document self.language = languages.get_language( document.settings.language_code, document.reporter) self.destination = destination self.translate() return self.destination.write(self.output) def translate(self) -> None: """ Do final translation of `self.document` into `self.output`. Called from `write`. Override in subclasses. Usually done with a `docutils.nodes.NodeVisitor` subclass, in combination with a call to `docutils.nodes.Node.walk()` or `docutils.nodes.Node.walkabout()`. The ``NodeVisitor`` subclass must support all standard elements (listed in `docutils.nodes.node_class_names`) and possibly non-standard elements used by the current Reader as well. """ raise NotImplementedError('subclass must override this method') def assemble_parts(self) -> None: """Assemble the `self.parts` dictionary. Extend in subclasses. See . """ self.parts['whole'] = self.output self.parts['encoding'] = self.document.settings.output_encoding self.parts['errors'] = ( self.document.settings.output_encoding_error_handler) self.parts['version'] = docutils.__version__ class UnfilteredWriter(Writer): """ A writer that passes the document tree on unchanged (e.g. a serializer.) Documents written by UnfilteredWriters are typically reused at a later date using a subclass of `readers.ReReader`. """ def get_transforms(self) -> list[type[Transform]]: # Do not add any transforms. When the document is reused # later, the then-used writer will add the appropriate # transforms. return Component.get_transforms(self) WRITER_ALIASES = {'html': 'html4css1', # may change to html5 some day 'html4': 'html4css1', 'xhtml10': 'html4css1', 'html5': 'html5_polyglot', 'xhtml': 'html5_polyglot', 's5': 's5_html', 'latex': 'latex2e', 'xelatex': 'xetex', 'luatex': 'xetex', 'lualatex': 'xetex', 'odf': 'odf_odt', 'odt': 'odf_odt', 'ooffice': 'odf_odt', 'openoffice': 'odf_odt', 'libreoffice': 'odf_odt', 'pprint': 'pseudoxml', 'pformat': 'pseudoxml', 'pdf': 'rlpdf', 'xml': 'docutils_xml', } def get_writer_class(writer_name: str) -> type[Writer]: """Return the Writer class from the `writer_name` module.""" name = writer_name.lower() name = WRITER_ALIASES.get(name, name) try: module = importlib.import_module('docutils.writers.'+name) except ImportError: try: module = importlib.import_module(name) except ImportError as err: raise ImportError(f'Writer "{writer_name}" not found. {err}') return module.Writer