"""Several HTML builders."""
from __future__ import annotations
import contextlib
import html
import os
import posixpath
import re
import shutil
import sys
import warnings
from os import path
from pathlib import Path
from typing import TYPE_CHECKING, Any
from urllib.parse import quote
import docutils.readers.doctree
from docutils import nodes
from docutils.core import Publisher
from docutils.frontend import OptionParser
from docutils.io import DocTreeInput, StringOutput
from docutils.utils import relative_path
from sphinx import __display_version__, package_dir
from sphinx import version_info as sphinx_version
from sphinx.builders import Builder
from sphinx.builders.html._assets import (
_CascadingStyleSheet,
_file_checksum,
_JavaScript,
)
from sphinx.builders.html._build_info import BuildInfo
from sphinx.config import ENUM, Config
from sphinx.deprecation import _deprecation_warning
from sphinx.domains import Index, IndexEntry
from sphinx.environment.adapters.asset import ImageAdapter
from sphinx.environment.adapters.indexentries import IndexEntries
from sphinx.environment.adapters.toctree import document_toc, global_toctree_for_doc
from sphinx.errors import ConfigError, ThemeError
from sphinx.highlighting import PygmentsBridge
from sphinx.locale import _, __
from sphinx.search import js_index
from sphinx.theming import HTMLThemeFactory
from sphinx.util import logging
from sphinx.util._timestamps import _format_rfc3339_microseconds
from sphinx.util._uri import is_url
from sphinx.util.console import bold
from sphinx.util.display import progress_message, status_iterator
from sphinx.util.docutils import new_document
from sphinx.util.fileutil import copy_asset
from sphinx.util.i18n import format_date
from sphinx.util.inventory import InventoryFile
from sphinx.util.matching import DOTFILES, Matcher, patmatch
from sphinx.util.osutil import (
SEP,
_last_modified_time,
copyfile,
ensuredir,
os_path,
relative_uri,
)
from sphinx.writers.html import HTMLWriter
from sphinx.writers.html5 import HTML5Translator
if TYPE_CHECKING:
from collections.abc import Iterable, Iterator
from typing import TypeAlias
from docutils.nodes import Node
from docutils.readers import Reader
from sphinx.application import Sphinx
from sphinx.environment import BuildEnvironment
from sphinx.util.typing import ExtensionMetadata
#: the filename for the inventory of objects
INVENTORY_FILENAME = 'objects.inv'
logger = logging.getLogger(__name__)
return_codes_re = re.compile('[\r\n]+')
DOMAIN_INDEX_TYPE: TypeAlias = tuple[
# Index name (e.g. py-modindex)
str,
# Index class
type[Index],
# list of (heading string, list of index entries) pairs.
list[tuple[str, list[IndexEntry]]],
# whether sub-entries should start collapsed
bool,
]
def convert_locale_to_language_tag(locale: str | None) -> str | None:
"""Convert a locale string to a language tag (ex. en_US -> en-US).
refs: BCP 47 (:rfc:`5646`)
"""
if locale:
return locale.replace('_', '-')
else:
return None
[docs]
class StandaloneHTMLBuilder(Builder):
"""
Builds standalone HTML docs.
"""
name = 'html'
format = 'html'
epilog = __('The HTML pages are in %(outdir)s.')
default_translator_class = HTML5Translator
copysource = True
allow_parallel = True
out_suffix = '.html'
link_suffix = '.html' # defaults to matching out_suffix
indexer_format: Any = js_index
indexer_dumps_unicode = True
# create links to original images from images [True/False]
html_scaled_image_link = True
supported_image_types = ['image/svg+xml', 'image/png', 'image/gif', 'image/jpeg']
supported_remote_images = True
supported_data_uri_images = True
searchindex_filename = 'searchindex.js'
add_permalinks = True
allow_sharp_as_current_path = True
embedded = False # for things like HTML help or Qt help: suppresses sidebar
search = True # for things like HTML help and Apple help: suppress search
use_index = False
download_support = True # enable download role
imgpath: str = ''
domain_indices: list[DOMAIN_INDEX_TYPE] = []
def __init__(self, app: Sphinx, env: BuildEnvironment) -> None:
super().__init__(app, env)
# CSS files
self._css_files: list[_CascadingStyleSheet] = []
# JS files
self._js_files: list[_JavaScript] = []
# Cached Publisher for writing doctrees to HTML
reader: Reader[DocTreeInput] = docutils.readers.doctree.Reader(
parser_name='restructuredtext'
)
pub = Publisher(
reader=reader,
parser=reader.parser,
writer=HTMLWriter(self),
source_class=DocTreeInput,
destination=StringOutput(encoding='unicode'),
)
pub.get_settings(output_encoding='unicode', traceback=True)
self._publisher = pub
def init(self) -> None:
self.build_info = self.create_build_info()
# basename of images directory
self.imagedir = '_images'
# section numbers for headings in the currently visited document
self.secnumbers: dict[str, tuple[int, ...]] = {}
# currently written docname
self.current_docname: str = ''
self.init_templates()
self.init_highlighter()
self.init_css_files()
self.init_js_files()
html_file_suffix = self.get_builder_config('file_suffix', 'html')
if html_file_suffix is not None:
self.out_suffix = html_file_suffix
html_link_suffix = self.get_builder_config('link_suffix', 'html')
if html_link_suffix is not None:
self.link_suffix = html_link_suffix
else:
self.link_suffix = self.out_suffix
self.use_index = self.get_builder_config('use_index', 'html')
def create_build_info(self) -> BuildInfo:
return BuildInfo(self.config, self.tags, frozenset({'html'}))
def _get_translations_js(self) -> str:
candidates = [
path.join(dir, self.config.language, 'LC_MESSAGES', 'sphinx.js')
for dir in self.config.locale_dirs
] + [
path.join(
package_dir, 'locale', self.config.language, 'LC_MESSAGES', 'sphinx.js'
),
path.join(
sys.prefix, 'share/sphinx/locale', self.config.language, 'sphinx.js'
),
]
for jsfile in candidates:
if path.isfile(jsfile):
return jsfile
return ''
def _get_style_filenames(self) -> Iterator[str]:
if isinstance(self.config.html_style, str):
yield self.config.html_style
elif self.config.html_style is not None:
yield from self.config.html_style
elif self.theme:
yield from self.theme.stylesheets
else:
yield 'default.css'
def get_theme_config(self) -> tuple[str, dict[str, str | int | bool]]:
return self.config.html_theme, self.config.html_theme_options
def init_templates(self) -> None:
theme_factory = HTMLThemeFactory(self.app)
theme_name, theme_options = self.get_theme_config()
self.theme = theme_factory.create(theme_name)
self.theme_options = theme_options
self.create_template_bridge()
self.templates.init(self, self.theme)
def init_highlighter(self) -> None:
# determine Pygments style and create the highlighter
if self.config.pygments_style is not None:
style = self.config.pygments_style
elif self.theme:
# From the ``pygments_style`` theme setting
style = self.theme.pygments_style_default or 'none'
else:
style = 'sphinx'
self.highlighter = PygmentsBridge('html', style)
if self.theme:
# From the ``pygments_dark_style`` theme setting
dark_style = self.theme.pygments_style_dark
else:
dark_style = None
self.dark_highlighter: PygmentsBridge | None
if dark_style is not None:
self.dark_highlighter = PygmentsBridge('html', dark_style)
self.app.add_css_file(
'pygments_dark.css',
media='(prefers-color-scheme: dark)',
id='pygments_dark_css',
)
else:
self.dark_highlighter = None
@property
def css_files(self) -> list[_CascadingStyleSheet]:
_deprecation_warning(
__name__, f'{self.__class__.__name__}.css_files', remove=(9, 0)
)
return self._css_files
def init_css_files(self) -> None:
self._css_files = []
self.add_css_file('pygments.css', priority=200)
for filename in self._get_style_filenames():
self.add_css_file(filename, priority=200)
for filename, attrs in self.app.registry.css_files:
self.add_css_file(filename, **attrs)
for filename, attrs in self.get_builder_config('css_files', 'html'):
# User's CSSs are loaded after extensions'
attrs.setdefault('priority', 800)
self.add_css_file(filename, **attrs)
def add_css_file(self, filename: str, **kwargs: Any) -> None:
if '://' not in filename:
filename = posixpath.join('_static', filename)
if (asset := _CascadingStyleSheet(filename, **kwargs)) not in self._css_files:
self._css_files.append(asset)
@property
def script_files(self) -> list[_JavaScript]:
canonical_name = f'{self.__class__.__name__}.script_files'
_deprecation_warning(__name__, canonical_name, remove=(9, 0))
return self._js_files
def init_js_files(self) -> None:
self._js_files = []
self.add_js_file('documentation_options.js', priority=200)
self.add_js_file('doctools.js', priority=200)
self.add_js_file('sphinx_highlight.js', priority=200)
for filename, attrs in self.app.registry.js_files:
self.add_js_file(filename or '', **attrs)
for filename, attrs in self.get_builder_config('js_files', 'html'):
attrs.setdefault('priority', 800) # User's JSs are loaded after extensions'
self.add_js_file(filename or '', **attrs)
if self._get_translations_js():
self.add_js_file('translations.js')
def add_js_file(self, filename: str, **kwargs: Any) -> None:
if filename and '://' not in filename:
filename = posixpath.join('_static', filename)
if (asset := _JavaScript(filename, **kwargs)) not in self._js_files:
self._js_files.append(asset)
@property
def math_renderer_name(self) -> str | None:
name = self.get_builder_config('math_renderer', 'html')
if name is not None:
# use given name
return name
else:
# not given: choose a math_renderer from registered ones as possible
renderers = list(self.app.registry.html_inline_math_renderers)
if len(renderers) == 1:
# only default math_renderer (mathjax) is registered
return renderers[0]
elif len(renderers) == 2:
# default and another math_renderer are registered; prior the another
renderers.remove('mathjax')
return renderers[0]
else:
# many math_renderers are registered. can't choose automatically!
return None
def get_outdated_docs(self) -> Iterator[str]:
build_info_fname = self.outdir / '.buildinfo'
try:
build_info = BuildInfo.load(build_info_fname)
except ValueError as exc:
logger.warning(__('Failed to read build info file: %r'), exc)
except OSError:
# ignore errors on reading
pass
else:
if self.build_info != build_info:
# log the mismatch and backup the old build info
build_info_backup = build_info_fname.with_name('.buildinfo.bak')
try:
shutil.move(build_info_fname, build_info_backup)
self.build_info.dump(build_info_fname)
except OSError:
pass # ignore errors
else:
# only log on success
msg = __(
'build_info mismatch, copying .buildinfo to .buildinfo.bak'
)
logger.info(bold(__('building [html]: ')) + msg)
yield from self.env.found_docs
return
if self.templates:
template_mtime = int(self.templates.newest_template_mtime() * 10**6)
try:
old_mtime = _last_modified_time(build_info_fname)
except Exception:
pass
else:
# Let users know they have a newer template
if template_mtime > old_mtime:
logger.info(
bold('building [html]: ')
+ __(
'template %s has been changed since the previous build, '
'all docs will be rebuilt'
),
self.templates.newest_template_name(),
)
else:
template_mtime = 0
for docname in self.env.found_docs:
if docname not in self.env.all_docs:
logger.debug('[build target] did not in env: %r', docname)
yield docname
continue
targetname = self.get_outfilename(docname)
try:
targetmtime = _last_modified_time(targetname)
except Exception:
targetmtime = 0
try:
doc_mtime = _last_modified_time(self.env.doc2path(docname))
srcmtime = max(doc_mtime, template_mtime)
if srcmtime > targetmtime:
logger.debug(
'[build target] targetname %r(%s), template(%s), docname %r(%s)',
targetname,
_format_rfc3339_microseconds(targetmtime),
_format_rfc3339_microseconds(template_mtime),
docname,
_format_rfc3339_microseconds(doc_mtime),
)
yield docname
except OSError:
# source doesn't exist anymore
pass
def get_asset_paths(self) -> list[str]:
return self.config.html_extra_path + self.config.html_static_path
def render_partial(self, node: Node | None) -> dict[str, str]:
"""Utility: Render a lone doctree node."""
if node is None:
return {'fragment': ''}
doc = new_document('<partial node>')
doc.append(node)
self._publisher.set_source(doc)
self._publisher.publish()
return self._publisher.writer.parts
def prepare_writing(self, docnames: set[str]) -> None:
# create the search indexer
self.indexer = None
if self.search:
from sphinx.search import IndexBuilder
lang = self.config.html_search_language or self.config.language
self.indexer = IndexBuilder(
self.env,
lang,
self.config.html_search_options,
self.config.html_search_scorer,
)
self.load_indexer(docnames)
self.docwriter = HTMLWriter(self)
with warnings.catch_warnings():
warnings.filterwarnings('ignore', category=DeprecationWarning)
# DeprecationWarning: The frontend.OptionParser class will be replaced
# by a subclass of argparse.ArgumentParser in Docutils 0.21 or later.
self.docsettings: Any = OptionParser(
defaults=self.env.settings,
components=(self.docwriter,),
read_config_files=True,
).get_default_values()
self.docsettings.compact_lists = bool(self.config.html_compact_lists)
# determine the additional indices to include
self.domain_indices = []
# html_domain_indices can be False/True or a list of index names
if indices_config := self.config.html_domain_indices:
if not isinstance(indices_config, bool):
check_names = True
indices_config = frozenset(indices_config)
else:
check_names = False
for domain in self.env.domains.sorted():
for index_cls in domain.indices:
index_name = f'{domain.name}-{index_cls.name}'
if check_names and index_name not in indices_config:
continue
content, collapse = index_cls(domain).generate()
if content:
self.domain_indices.append((
index_name,
index_cls,
content,
collapse,
))
# format the "last updated on" string, only once is enough since it
# typically doesn't include the time of day
last_updated: str | None
if (lu_fmt := self.config.html_last_updated_fmt) is not None:
last_updated = format_date(
lu_fmt or _('%b %d, %Y'),
language=self.config.language,
local_time=not self.config.html_last_updated_use_utc,
)
else:
last_updated = None
# If the logo or favicon are urls, keep them as-is, otherwise
# strip the relative path as the files will be copied into _static.
logo = self.config.html_logo or ''
favicon = self.config.html_favicon or ''
if not is_url(logo):
logo = path.basename(logo)
if not is_url(favicon):
favicon = path.basename(favicon)
self.relations = self.env.collect_relations()
rellinks: list[tuple[str, str, str, str]] = []
if self.use_index:
rellinks.append(('genindex', _('General Index'), 'I', _('index')))
for indexname, indexcls, _content, _collapse in self.domain_indices:
# if it has a short name
if indexcls.shortname:
rellinks.append((indexname, indexcls.localname, '', indexcls.shortname))
# add assets registered after ``Builder.init()``.
for css_filename, attrs in self.app.registry.css_files:
self.add_css_file(css_filename, **attrs)
for js_filename, attrs in self.app.registry.js_files:
self.add_js_file(js_filename or '', **attrs)
# back up _css_files and _js_files to allow adding CSS/JS files to a specific page.
self._orig_css_files = list(dict.fromkeys(self._css_files))
self._orig_js_files = list(dict.fromkeys(self._js_files))
styles = list(self._get_style_filenames())
self.globalcontext = {
'embedded': self.embedded,
'project': self.config.project,
'release': return_codes_re.sub('', self.config.release),
'version': self.config.version,
'last_updated': last_updated,
'copyright': self.config.copyright,
'master_doc': self.config.root_doc,
'root_doc': self.config.root_doc,
'use_opensearch': self.config.html_use_opensearch,
'docstitle': self.config.html_title,
'shorttitle': self.config.html_short_title,
'show_copyright': self.config.html_show_copyright,
'show_search_summary': self.config.html_show_search_summary,
'show_sphinx': self.config.html_show_sphinx,
'has_source': self.config.html_copy_source,
'show_source': self.config.html_show_sourcelink,
'sourcelink_suffix': self.config.html_sourcelink_suffix,
'file_suffix': self.out_suffix,
'link_suffix': self.link_suffix,
'script_files': self._js_files,
'language': convert_locale_to_language_tag(self.config.language),
'css_files': self._css_files,
'sphinx_version': __display_version__,
'sphinx_version_tuple': sphinx_version,
'docutils_version_info': docutils.__version_info__[:5],
'styles': styles,
'rellinks': rellinks,
'builder': self.name,
'parents': [],
'logo_url': logo,
'logo_alt': _('Logo of %s') % self.config.project,
'favicon_url': favicon,
'html5_doctype': True,
}
if self.theme:
self.globalcontext |= {
f'theme_{key}': val
for key, val in self.theme.get_options(self.theme_options).items()
}
self.globalcontext |= self.config.html_context
def get_doc_context(self, docname: str, body: str, metatags: str) -> dict[str, Any]:
"""Collect items for the template context of a page."""
# find out relations
prev = next = None
parents = []
rellinks = self.globalcontext['rellinks'][:]
related = self.relations.get(docname)
titles = self.env.titles
if related and related[2]:
try:
next = {
'link': self.get_relative_uri(docname, related[2]),
'title': self.render_partial(titles[related[2]])['title'],
}
rellinks.append((related[2], next['title'], 'N', _('next')))
except KeyError:
next = None
if related and related[1]:
try:
prev = {
'link': self.get_relative_uri(docname, related[1]),
'title': self.render_partial(titles[related[1]])['title'],
}
rellinks.append((related[1], prev['title'], 'P', _('previous')))
except KeyError:
# the relation is (somehow) not in the TOC tree, handle
# that gracefully
prev = None
while related and related[0]:
with contextlib.suppress(KeyError):
parents.append({
'link': self.get_relative_uri(docname, related[0]),
'title': self.render_partial(titles[related[0]])['title'],
})
related = self.relations.get(related[0])
if parents:
# remove link to the master file; we have a generic
# "back to index" link already
parents.pop()
parents.reverse()
# title rendered as HTML
title_node = self.env.longtitles.get(docname)
title = self.render_partial(title_node)['title'] if title_node else ''
# Suffix for the document
source_suffix = str(self.env.doc2path(docname, False))[len(docname) :]
# the name for the copied source
if self.config.html_copy_source:
sourcename = docname + source_suffix
if source_suffix != self.config.html_sourcelink_suffix:
sourcename += self.config.html_sourcelink_suffix
else:
sourcename = ''
# metadata for the document
meta = self.env.metadata.get(docname)
# local TOC and global TOC tree
self_toc = document_toc(self.env, docname, self.tags)
toc = self.render_partial(self_toc)['fragment']
return {
'parents': parents,
'prev': prev,
'next': next,
'title': title,
'meta': meta,
'body': body,
'metatags': metatags,
'rellinks': rellinks,
'sourcename': sourcename,
'toc': toc,
# only display a TOC if there's more than one item to show
'display_toc': (self.env.toc_num_entries[docname] > 1),
'page_source_suffix': source_suffix,
}
def copy_assets(self) -> None:
self.finish_tasks.add_task(self.copy_download_files)
self.finish_tasks.add_task(self.copy_static_files)
self.finish_tasks.add_task(self.copy_extra_files)
self.finish_tasks.join()
def write_doc(self, docname: str, doctree: nodes.document) -> None:
destination = StringOutput(encoding='utf-8')
doctree.settings = self.docsettings
self.secnumbers = self.env.toc_secnumbers.get(docname, {})
self.fignumbers = self.env.toc_fignumbers.get(docname, {})
self.imgpath = relative_uri(self.get_target_uri(docname), '_images')
self.dlpath = relative_uri(self.get_target_uri(docname), '_downloads')
self.current_docname = docname
self.docwriter.write(doctree, destination)
self.docwriter.assemble_parts()
body = self.docwriter.parts['fragment']
metatags = self.docwriter.clean_meta
ctx = self.get_doc_context(docname, body, metatags)
self.handle_page(docname, ctx, event_arg=doctree)
def write_doc_serialized(self, docname: str, doctree: nodes.document) -> None:
self.imgpath = relative_uri(self.get_target_uri(docname), self.imagedir)
self.post_process_images(doctree)
title_node = self.env.longtitles.get(docname)
title = self.render_partial(title_node)['title'] if title_node else ''
self.index_page(docname, doctree, title)
def finish(self) -> None:
self.finish_tasks.add_task(self.gen_indices)
self.finish_tasks.add_task(self.gen_pages_from_extensions)
self.finish_tasks.add_task(self.gen_additional_pages)
self.finish_tasks.add_task(self.copy_image_files)
self.finish_tasks.add_task(self.write_buildinfo)
# dump the search index
self.handle_finish()
@progress_message(__('generating indices'))
def gen_indices(self) -> None:
# the global general index
if self.use_index:
self.write_genindex()
# the global domain-specific indices
self.write_domain_indices()
def gen_pages_from_extensions(self) -> None:
# pages from extensions
for pagelist in self.events.emit('html-collect-pages'):
for pagename, context, template in pagelist:
self.handle_page(pagename, context, template)
@progress_message(__('writing additional pages'))
def gen_additional_pages(self) -> None:
# additional pages from conf.py
for pagename, template in self.config.html_additional_pages.items():
logger.info(pagename + ' ', nonl=True)
self.handle_page(pagename, {}, template)
# the search page
if self.search:
logger.info('search ', nonl=True)
self.handle_page('search', {}, 'search.html')
# the opensearch xml file
if self.config.html_use_opensearch and self.search:
logger.info('opensearch ', nonl=True)
fn = path.join(self.outdir, '_static', 'opensearch.xml')
self.handle_page('opensearch', {}, 'opensearch.xml', outfilename=fn)
def write_genindex(self) -> None:
# the total count of lines for each index letter, used to distribute
# the entries into two columns
genindex = IndexEntries(self.env).create_index(self)
indexcounts = [
sum(1 + len(subitems) for _, (_, subitems, _) in entries)
for _k, entries in genindex
]
genindexcontext = {
'genindexentries': genindex,
'genindexcounts': indexcounts,
'split_index': self.config.html_split_index,
}
logger.info('genindex ', nonl=True)
if self.config.html_split_index:
self.handle_page('genindex', genindexcontext, 'genindex-split.html')
self.handle_page('genindex-all', genindexcontext, 'genindex.html')
for (key, entries), count in zip(genindex, indexcounts, strict=True):
ctx = {
'key': key,
'entries': entries,
'count': count,
'genindexentries': genindex,
}
self.handle_page('genindex-' + key, ctx, 'genindex-single.html')
else:
self.handle_page('genindex', genindexcontext, 'genindex.html')
def write_domain_indices(self) -> None:
for indexname, indexcls, content, collapse in self.domain_indices:
indexcontext = {
'indextitle': indexcls.localname,
'content': content,
'collapse_index': collapse,
}
logger.info(indexname + ' ', nonl=True)
self.handle_page(indexname, indexcontext, 'domainindex.html')
def copy_image_files(self) -> None:
if self.images:
stringify_func = ImageAdapter(self.app.env).get_original_image_uri
ensuredir(self.outdir / self.imagedir)
for src in status_iterator(
self.images,
__('copying images... '),
'brown',
len(self.images),
self.app.verbosity,
stringify_func=stringify_func,
):
dest = self.images[src]
try:
copyfile(
self.srcdir / src,
self.outdir / self.imagedir / dest,
force=True,
)
except Exception as err:
logger.warning(
__("cannot copy image file '%s': %s"), self.srcdir / src, err
)
def copy_download_files(self) -> None:
def to_relpath(f: str) -> str:
return relative_path(self.srcdir, f)
# copy downloadable files
if self.env.dlfiles:
ensuredir(self.outdir / '_downloads')
for src in status_iterator(
self.env.dlfiles,
__('copying downloadable files... '),
'brown',
len(self.env.dlfiles),
self.app.verbosity,
stringify_func=to_relpath,
):
try:
dest = self.outdir / '_downloads' / self.env.dlfiles[src][1]
ensuredir(dest.parent)
copyfile(self.srcdir / src, dest, force=True)
except OSError as err:
logger.warning(
__('cannot copy downloadable file %r: %s'),
self.srcdir / src,
err,
)
def create_pygments_style_file(self) -> None:
"""Create a style file for pygments."""
pyg_path = path.join(self.outdir, '_static', 'pygments.css')
with open(pyg_path, 'w', encoding='utf-8') as f:
f.write(self.highlighter.get_stylesheet())
if self.dark_highlighter:
dark_path = path.join(self.outdir, '_static', 'pygments_dark.css')
with open(dark_path, 'w', encoding='utf-8') as f:
f.write(self.dark_highlighter.get_stylesheet())
def copy_translation_js(self) -> None:
"""Copy a JavaScript file for translations."""
jsfile = self._get_translations_js()
if jsfile:
copyfile(
jsfile,
self.outdir / '_static' / 'translations.js',
force=True,
)
def copy_stemmer_js(self) -> None:
"""Copy a JavaScript file for stemmer."""
if self.indexer is not None:
if hasattr(self.indexer, 'get_js_stemmer_rawcodes'):
for jsfile in self.indexer.get_js_stemmer_rawcodes():
js_path = Path(jsfile)
copyfile(
js_path,
self.outdir / '_static' / js_path.name,
force=True,
)
else:
if js_stemmer_rawcode := self.indexer.get_js_stemmer_rawcode():
copyfile(
js_stemmer_rawcode,
self.outdir / '_static' / '_stemmer.js',
force=True,
)
def copy_theme_static_files(self, context: dict[str, Any]) -> None:
def onerror(filename: str, error: Exception) -> None:
msg = __("Failed to copy a file in the theme's 'static' directory: %s: %r")
logger.warning(msg, filename, error)
if self.theme:
for entry in reversed(self.theme.get_theme_dirs()):
copy_asset(
Path(entry) / 'static',
self.outdir / '_static',
excluded=DOTFILES,
context=context,
renderer=self.templates,
onerror=onerror,
force=True,
)
def copy_html_static_files(self, context: dict[str, Any]) -> None:
def onerror(filename: str, error: Exception) -> None:
logger.warning(
__('Failed to copy a file in html_static_file: %s: %r'), filename, error
)
excluded = Matcher([*self.config.exclude_patterns, '**/.*'])
for entry in self.config.html_static_path:
copy_asset(
self.confdir / entry,
self.outdir / '_static',
excluded=excluded,
context=context,
renderer=self.templates,
onerror=onerror,
force=True,
)
def copy_html_logo(self) -> None:
if self.config.html_logo and not is_url(self.config.html_logo):
source_path = self.confdir / self.config.html_logo
copyfile(
source_path,
self.outdir / '_static' / source_path.name,
force=True,
)
def copy_html_favicon(self) -> None:
if self.config.html_favicon and not is_url(self.config.html_favicon):
source_path = self.confdir / self.config.html_favicon
copyfile(
source_path,
self.outdir / '_static' / source_path.name,
force=True,
)
def copy_static_files(self) -> None:
try:
with progress_message(__('copying static files'), nonl=False):
ensuredir(self.outdir / '_static')
# prepare context for templates
context = self.globalcontext.copy()
if self.indexer is not None:
context.update(self.indexer.context_for_searchtool())
self.create_pygments_style_file()
self.copy_translation_js()
self.copy_stemmer_js()
self.copy_theme_static_files(context)
self.copy_html_static_files(context)
self.copy_html_logo()
self.copy_html_favicon()
except OSError as err:
logger.warning(__('cannot copy static file %r'), err)
def copy_extra_files(self) -> None:
"""Copy html_extra_path files."""
try:
with progress_message(__('copying extra files'), nonl=False):
excluded = Matcher(self.config.exclude_patterns)
for extra_path in self.config.html_extra_path:
copy_asset(
self.confdir / extra_path,
self.outdir,
excluded=excluded,
force=True,
)
except OSError as err:
logger.warning(__('cannot copy extra file %r'), err)
def write_buildinfo(self) -> None:
try:
self.build_info.dump(self.outdir / '.buildinfo')
except OSError as exc:
logger.warning(__('Failed to write build info file: %r'), exc)
def cleanup(self) -> None:
# clean up theme stuff
if self.theme:
self.theme._cleanup()
def post_process_images(self, doctree: Node) -> None:
"""Pick the best candidate for an image and link down-scaled images to
their high resolution version.
"""
super().post_process_images(doctree)
if self.config.html_scaled_image_link and self.html_scaled_image_link:
for node in doctree.findall(nodes.image):
if not any((key in node) for key in ('scale', 'width', 'height')):
# resizing options are not given. scaled image link is available
# only for resized images.
continue
if isinstance(node.parent, nodes.reference):
# A image having hyperlink target
continue
if 'no-scaled-link' in node['classes']:
# scaled image link is disabled for this node
continue
uri = node['uri']
reference = nodes.reference('', '', internal=True)
if uri in self.images:
reference['refuri'] = posixpath.join(self.imgpath, self.images[uri])
else:
reference['refuri'] = uri
node.replace_self(reference)
reference.append(node)
def load_indexer(self, docnames: Iterable[str]) -> None:
assert self.indexer is not None
keep = set(self.env.all_docs) - set(docnames)
try:
searchindexfn = path.join(self.outdir, self.searchindex_filename)
if self.indexer_dumps_unicode:
with open(searchindexfn, encoding='utf-8') as ft:
self.indexer.load(ft, self.indexer_format)
else:
with open(searchindexfn, 'rb') as fb:
self.indexer.load(fb, self.indexer_format)
except (OSError, ValueError):
if keep:
logger.warning(
__(
"search index couldn't be loaded, but not all "
'documents will be built: the index will be '
'incomplete.'
)
)
# delete all entries for files that will be rebuilt
self.indexer.prune(keep)
def index_page(self, pagename: str, doctree: nodes.document, title: str) -> None:
# only index pages with title
if self.indexer is not None and title:
filename = str(self.env.doc2path(pagename, base=False))
metadata = self.env.metadata.get(pagename, {})
if 'no-search' in metadata or 'nosearch' in metadata:
self.indexer.feed(pagename, filename, '', new_document(''))
else:
self.indexer.feed(pagename, filename, title, doctree)
def _get_local_toctree(
self, docname: str, collapse: bool = True, **kwargs: Any
) -> str:
if 'includehidden' not in kwargs:
kwargs['includehidden'] = False
if kwargs.get('maxdepth') == '':
kwargs.pop('maxdepth')
toctree = global_toctree_for_doc(
self.env, docname, self, collapse=collapse, **kwargs
)
return self.render_partial(toctree)['fragment']
def get_outfilename(self, pagename: str) -> str:
return path.join(self.outdir, os_path(pagename) + self.out_suffix)
def add_sidebars(self, pagename: str, ctx: dict[str, Any]) -> None:
def has_wildcard(pattern: str) -> bool:
return any(char in pattern for char in '*?[')
matched = None
# default sidebars settings for selected theme
sidebars = list(self.theme.sidebar_templates)
# user sidebar settings
html_sidebars = self.get_builder_config('sidebars', 'html')
msg = __('page %s matches two patterns in html_sidebars: %r and %r')
for pattern, pat_sidebars in html_sidebars.items():
if patmatch(pagename, pattern):
if matched and has_wildcard(pattern):
# warn if both patterns contain wildcards
if has_wildcard(matched):
logger.warning(msg, pagename, matched)
# else the already matched pattern is more specific
# than the present one, because it contains no wildcard
continue
matched = pattern
sidebars = pat_sidebars
ctx['sidebars'] = list(sidebars)
# --------- these are overwritten by the serialization builder
def get_target_uri(self, docname: str, typ: str | None = None) -> str:
return quote(docname) + self.link_suffix
def handle_page(
self,
pagename: str,
addctx: dict[str, Any],
templatename: str = 'page.html',
outfilename: str | None = None,
event_arg: Any = None,
) -> None:
ctx = self.globalcontext.copy()
# current_page_name is backwards compatibility
ctx['pagename'] = ctx['current_page_name'] = pagename
ctx['encoding'] = self.config.html_output_encoding
default_baseuri = self.get_target_uri(pagename)
# in the singlehtml builder, default_baseuri still contains an #anchor
# part, which relative_uri doesn't really like...
default_baseuri = default_baseuri.rsplit('#', 1)[0]
if self.config.html_baseurl:
ctx['pageurl'] = posixpath.join(
self.config.html_baseurl, self.get_target_uri(pagename)
)
else:
ctx['pageurl'] = None
def pathto(
otheruri: str,
resource: bool = False,
baseuri: str = default_baseuri,
) -> str:
if resource and '://' in otheruri:
# allow non-local resources given by scheme
return otheruri
elif not resource:
otheruri = self.get_target_uri(otheruri)
uri = relative_uri(baseuri, otheruri) or '#'
if uri == '#' and not self.allow_sharp_as_current_path:
uri = baseuri
return uri
ctx['pathto'] = pathto
def hasdoc(name: str) -> bool:
if name in self.env.all_docs:
return True
if name == 'search' and self.search:
return True
return name == 'genindex' and self.get_builder_config('use_index', 'html')
ctx['hasdoc'] = hasdoc
ctx['toctree'] = lambda **kwargs: self._get_local_toctree(pagename, **kwargs)
self.add_sidebars(pagename, ctx)
ctx.update(addctx)
# 'blah.html' should have content_root = './' not ''.
ctx['content_root'] = (f'..{SEP}' * default_baseuri.count(SEP)) or f'.{SEP}'
outdir = self.app.outdir
def css_tag(css: _CascadingStyleSheet) -> str:
attrs = [
f'{key}="{html.escape(value, quote=True)}"'
for key, value in css.attributes.items()
if value is not None
]
uri = pathto(os.fspath(css.filename), resource=True)
# the EPUB format does not allow the use of query components
# the Windows help compiler requires that css links
# don't have a query component
if self.name not in {'epub', 'htmlhelp'}:
if checksum := _file_checksum(outdir, css.filename):
uri += f'?v={checksum}'
return f'<link {" ".join(sorted(attrs))} href="{uri}" />'
ctx['css_tag'] = css_tag
def js_tag(js: _JavaScript | str) -> str:
if not isinstance(js, _JavaScript):
# str value (old styled)
return f'<script src="{pathto(js, resource=True)}"></script>'
body = js.attributes.get('body', '')
attrs = [
f'{key}="{html.escape(value, quote=True)}"'
for key, value in js.attributes.items()
if key != 'body' and value is not None
]
if not js.filename:
if attrs:
return f'<script {" ".join(sorted(attrs))}>{body}</script>'
return f'<script>{body}</script>'
uri = pathto(os.fspath(js.filename), resource=True)
if 'MathJax.js?' in os.fspath(js.filename):
# MathJax v2 reads a ``?config=...`` query parameter,
# special case this and just skip adding the checksum.
# https://docs.mathjax.org/en/v2.7-latest/configuration.html#considerations-for-using-combined-configuration-files
# https://github.com/sphinx-doc/sphinx/issues/11658
pass
# the EPUB format does not allow the use of query components
elif self.name != 'epub':
if checksum := _file_checksum(outdir, js.filename):
uri += f'?v={checksum}'
if attrs:
return f'<script {" ".join(sorted(attrs))} src="{uri}"></script>'
return f'<script src="{uri}"></script>'
ctx['js_tag'] = js_tag
# revert _css_files and _js_files
self._css_files[:] = self._orig_css_files
self._js_files[:] = self._orig_js_files
self.update_page_context(pagename, templatename, ctx, event_arg)
newtmpl = self.app.emit_firstresult(
'html-page-context', pagename, templatename, ctx, event_arg
)
if newtmpl:
templatename = newtmpl
# sort JS/CSS before rendering HTML
try: # NoQA: SIM105
# Convert script_files to list to support non-list script_files (refs: #8889)
ctx['script_files'] = sorted(
ctx['script_files'], key=lambda js: js.priority
)
except AttributeError:
# Skip sorting if users modifies script_files directly (maybe via `html_context`).
# refs: #8885
#
# Note: priority sorting feature will not work in this case.
pass
with contextlib.suppress(AttributeError):
ctx['css_files'] = sorted(ctx['css_files'], key=lambda css: css.priority)
try:
output = self.templates.render(templatename, ctx)
except UnicodeError:
logger.warning(
__(
'a Unicode error occurred when rendering the page %s. '
'Please make sure all config values that contain '
'non-ASCII content are Unicode strings.'
),
pagename,
)
return
except Exception as exc:
msg = __('An error happened in rendering the page %s.\nReason: %r') % (
pagename,
exc,
)
raise ThemeError(msg) from exc
if not outfilename:
outfilename = self.get_outfilename(pagename)
# outfilename's path is in general different from self.outdir
ensuredir(path.dirname(outfilename))
try:
with open(
outfilename, 'w', encoding=ctx['encoding'], errors='xmlcharrefreplace'
) as f:
f.write(output)
except OSError as err:
logger.warning(__('error writing file %s: %s'), outfilename, err)
if self.copysource and ctx.get('sourcename'):
# copy the source file for the "show source" link
source_name = path.join(self.outdir, '_sources', os_path(ctx['sourcename']))
ensuredir(path.dirname(source_name))
copyfile(self.env.doc2path(pagename), source_name, force=True)
def update_page_context(
self, pagename: str, templatename: str, ctx: dict[str, Any], event_arg: Any
) -> None:
pass
def handle_finish(self) -> None:
self.finish_tasks.add_task(self.dump_search_index)
self.finish_tasks.add_task(self.dump_inventory)
@progress_message(__('dumping object inventory'))
def dump_inventory(self) -> None:
InventoryFile.dump(path.join(self.outdir, INVENTORY_FILENAME), self.env, self)
def dump_search_index(self) -> None:
if self.indexer is None:
return
with progress_message(__('dumping search index in %s') % self.indexer.label()):
self.indexer.prune(self.env.all_docs)
searchindexfn = path.join(self.outdir, self.searchindex_filename)
# first write to a temporary file, so that if dumping fails,
# the existing index won't be overwritten
if self.indexer_dumps_unicode:
with open(searchindexfn + '.tmp', 'w', encoding='utf-8') as ft:
self.indexer.dump(ft, self.indexer_format)
else:
with open(searchindexfn + '.tmp', 'wb') as fb:
self.indexer.dump(fb, self.indexer_format)
os.replace(searchindexfn + '.tmp', searchindexfn)
def convert_html_css_files(app: Sphinx, config: Config) -> None:
"""Convert string styled html_css_files to tuple styled one."""
html_css_files: list[tuple[str, dict[str, str]]] = []
for entry in config.html_css_files:
if isinstance(entry, str):
html_css_files.append((entry, {}))
else:
try:
filename, attrs = entry
html_css_files.append((filename, attrs))
except Exception:
logger.warning(__('invalid css_file: %r, ignored'), entry)
continue
config.html_css_files = html_css_files
def convert_html_js_files(app: Sphinx, config: Config) -> None:
"""Convert string styled html_js_files to tuple styled one."""
html_js_files: list[tuple[str, dict[str, str]]] = []
for entry in config.html_js_files:
if isinstance(entry, str):
html_js_files.append((entry, {}))
else:
try:
filename, attrs = entry
html_js_files.append((filename, attrs))
except Exception:
logger.warning(__('invalid js_file: %r, ignored'), entry)
continue
config.html_js_files = html_js_files
def setup_resource_paths(
app: Sphinx,
pagename: str,
templatename: str,
context: dict[str, Any],
doctree: Node,
) -> None:
"""Set up relative resource paths."""
pathto = context['pathto']
# favicon_url
favicon_url = context.get('favicon_url')
if favicon_url and not is_url(favicon_url):
context['favicon_url'] = pathto('_static/' + favicon_url, resource=True)
# logo_url
logo_url = context.get('logo_url')
if logo_url and not is_url(logo_url):
context['logo_url'] = pathto('_static/' + logo_url, resource=True)
def validate_math_renderer(app: Sphinx) -> None:
if app.builder.format != 'html':
return
name = app.builder.math_renderer_name # type: ignore[attr-defined]
if name is None:
msg = __(
'Many math_renderers are registered. But no math_renderer is selected.'
)
raise ConfigError(msg)
if name not in app.registry.html_inline_math_renderers:
raise ConfigError(__('Unknown math_renderer %r is given.') % name)
def validate_html_extra_path(app: Sphinx, config: Config) -> None:
"""Check html_extra_paths setting."""
for entry in config.html_extra_path[:]:
extra_path = path.normpath(path.join(app.confdir, entry))
if not path.exists(extra_path):
logger.warning(__('html_extra_path entry %r does not exist'), entry)
config.html_extra_path.remove(entry)
elif (
path.splitdrive(app.outdir)[0] == path.splitdrive(extra_path)[0]
and path.commonpath((app.outdir, extra_path)) == path.normpath(app.outdir)
): # fmt: skip
logger.warning(
__('html_extra_path entry %r is placed inside outdir'), entry
)
config.html_extra_path.remove(entry)
def validate_html_static_path(app: Sphinx, config: Config) -> None:
"""Check html_static_paths setting."""
for entry in config.html_static_path[:]:
static_path = path.normpath(path.join(app.confdir, entry))
if not path.exists(static_path):
logger.warning(__('html_static_path entry %r does not exist'), entry)
config.html_static_path.remove(entry)
elif (
path.splitdrive(app.outdir)[0] == path.splitdrive(static_path)[0]
and path.commonpath((app.outdir, static_path)) == path.normpath(app.outdir)
): # fmt: skip
logger.warning(
__('html_static_path entry %r is placed inside outdir'), entry
)
config.html_static_path.remove(entry)
def validate_html_logo(app: Sphinx, config: Config) -> None:
"""Check html_logo setting."""
if (
config.html_logo
and not path.isfile(path.join(app.confdir, config.html_logo))
and not is_url(config.html_logo)
):
logger.warning(__('logo file %r does not exist'), config.html_logo)
config.html_logo = None
def validate_html_favicon(app: Sphinx, config: Config) -> None:
"""Check html_favicon setting."""
if (
config.html_favicon
and not path.isfile(path.join(app.confdir, config.html_favicon))
and not is_url(config.html_favicon)
):
logger.warning(__('favicon file %r does not exist'), config.html_favicon)
config.html_favicon = None
def error_on_html_sidebars_string_values(app: Sphinx, config: Config) -> None:
"""Support removed in Sphinx 2."""
errors = {}
for pattern, pat_sidebars in config.html_sidebars.items():
if isinstance(pat_sidebars, str):
errors[pattern] = [pat_sidebars]
if not errors:
return
msg = __(
"Values in 'html_sidebars' must be a list of strings. "
'At least one pattern has a string value: %s. '
'Change to `html_sidebars = %r`.'
)
bad_patterns = ', '.join(map(repr, errors))
fixed = config.html_sidebars | errors
raise ConfigError(msg % (bad_patterns, fixed))
def error_on_html_4(_app: Sphinx, config: Config) -> None:
"""Error on HTML 4."""
if config.html4_writer:
msg = __(
'HTML 4 is no longer supported by Sphinx. '
'("html4_writer=True" detected in configuration options)',
)
raise ConfigError(msg)
def setup(app: Sphinx) -> ExtensionMetadata:
# builders
app.add_builder(StandaloneHTMLBuilder)
# config values
app.add_config_value('html_theme', 'alabaster', 'html')
app.add_config_value('html_theme_path', [], 'html')
app.add_config_value('html_theme_options', {}, 'html')
app.add_config_value(
'html_title',
lambda c: _('%s %s documentation') % (c.project, c.release),
'html',
str,
)
app.add_config_value('html_short_title', lambda self: self.html_title, 'html')
app.add_config_value('html_style', None, 'html', {list, str})
app.add_config_value('html_logo', None, 'html', str)
app.add_config_value('html_favicon', None, 'html', str)
app.add_config_value('html_css_files', [], 'html')
app.add_config_value('html_js_files', [], 'html')
app.add_config_value('html_static_path', [], 'html')
app.add_config_value('html_extra_path', [], 'html')
app.add_config_value('html_last_updated_fmt', None, 'html', str)
app.add_config_value('html_last_updated_use_utc', False, 'html', types={bool})
app.add_config_value('html_sidebars', {}, 'html')
app.add_config_value('html_additional_pages', {}, 'html')
app.add_config_value('html_domain_indices', True, 'html', types={set, list})
app.add_config_value('html_permalinks', True, 'html')
app.add_config_value('html_permalinks_icon', 'ΒΆ', 'html')
app.add_config_value('html_use_index', True, 'html')
app.add_config_value('html_split_index', False, 'html')
app.add_config_value('html_copy_source', True, 'html')
app.add_config_value('html_show_sourcelink', True, 'html')
app.add_config_value('html_sourcelink_suffix', '.txt', 'html')
app.add_config_value('html_use_opensearch', '', 'html')
app.add_config_value('html_file_suffix', None, 'html', str)
app.add_config_value('html_link_suffix', None, 'html', str)
app.add_config_value('html_show_copyright', True, 'html')
app.add_config_value('html_show_search_summary', True, 'html')
app.add_config_value('html_show_sphinx', True, 'html')
app.add_config_value('html_context', {}, 'html')
app.add_config_value('html_output_encoding', 'utf-8', 'html')
app.add_config_value('html_compact_lists', True, 'html')
app.add_config_value('html_secnumber_suffix', '. ', 'html')
app.add_config_value('html_search_language', None, 'html', str)
app.add_config_value('html_search_options', {}, 'html')
app.add_config_value('html_search_scorer', '', '')
app.add_config_value('html_scaled_image_link', True, 'html')
app.add_config_value('html_baseurl', '', 'html')
# removal is indefinitely on hold (ref: https://github.com/sphinx-doc/sphinx/issues/10265)
app.add_config_value(
'html_codeblock_linenos_style', 'inline', 'html', ENUM('table', 'inline')
)
app.add_config_value('html_math_renderer', None, 'env')
app.add_config_value('html4_writer', False, 'html')
# events
app.add_event('html-collect-pages')
app.add_event('html-page-context')
# event handlers
app.connect('config-inited', convert_html_css_files, priority=800)
app.connect('config-inited', convert_html_js_files, priority=800)
app.connect('config-inited', validate_html_extra_path, priority=800)
app.connect('config-inited', validate_html_static_path, priority=800)
app.connect('config-inited', validate_html_logo, priority=800)
app.connect('config-inited', validate_html_favicon, priority=800)
app.connect('config-inited', error_on_html_sidebars_string_values, priority=800)
app.connect('config-inited', error_on_html_4, priority=800)
app.connect('builder-inited', validate_math_renderer)
app.connect('html-page-context', setup_resource_paths)
# load default math renderer
app.setup_extension('sphinx.ext.mathjax')
# load transforms for HTML builder
app.setup_extension('sphinx.builders.html.transforms')
return {
'version': 'builtin',
'parallel_read_safe': True,
'parallel_write_safe': True,
}
# deprecated name -> (object to return, canonical path or empty string, removal version)
_DEPRECATED_OBJECTS: dict[str, tuple[Any, str, tuple[int, int]]] = {
'Stylesheet': (
_CascadingStyleSheet,
'sphinx.builders.html._assets._CascadingStyleSheet',
(9, 0),
),
'JavaScript': (_JavaScript, 'sphinx.builders.html._assets._JavaScript', (9, 0)),
}
def __getattr__(name: str) -> Any:
if name not in _DEPRECATED_OBJECTS:
msg = f'module {__name__!r} has no attribute {name!r}'
raise AttributeError(msg)
from sphinx.deprecation import _deprecation_warning
deprecated_object, canonical_name, remove = _DEPRECATED_OBJECTS[name]
_deprecation_warning(__name__, name, canonical_name, remove=remove)
return deprecated_object