# -*- coding: utf-8 -*-
# Author: Óscar Nájera
# License: 3-clause BSD
"""
Sphinx-Gallery Generator
========================
Attaches Sphinx-Gallery to Sphinx in order to generate the galleries
when building the documentation.
"""
from __future__ import division, print_function, absolute_import
import codecs
import copy
from datetime import timedelta, datetime
from difflib import get_close_matches
from importlib import import_module
import re
import os
import pathlib
from xml.sax.saxutils import quoteattr, escape
from sphinx.errors import ConfigError, ExtensionError
import sphinx.util
from sphinx.util.console import red
from . import glr_path_static, __version__ as _sg_version
from .utils import _replace_md5, _has_optipng, _has_pypandoc, _has_graphviz
from .backreferences import _finalize_backreferences
from .gen_rst import (generate_dir_rst, SPHX_GLR_SIG, _get_memory_base,
_get_readme)
from .scrapers import _scraper_dict, _reset_dict, _import_matplotlib
from .docs_resolv import embed_code_links
from .downloads import generate_zipfiles
from .sorting import NumberOfCodeLinesSortKey
from .interactive_example import (
copy_binder_files, check_binder_conf, check_jupyterlite_conf
)
from .interactive_example import pre_configure_jupyterlite_sphinx
from .interactive_example import post_configure_jupyterlite_sphinx
from .interactive_example import create_jupyterlite_contents
from .directives import MiniGallery, ImageSg, imagesg_addnode
_KNOWN_CSS = ('sg_gallery', 'sg_gallery-binder', 'sg_gallery-dataframe',
'sg_gallery-rendered-html')
[docs]class DefaultResetArgv:
def __repr__(self):
return "DefaultResetArgv"
def __call__(self, gallery_conf, script_vars):
return []
DEFAULT_GALLERY_CONF = {
'filename_pattern': re.escape(os.sep) + 'plot',
'ignore_pattern': r'__init__\.py',
'examples_dirs': os.path.join('..', 'examples'),
'reset_argv': DefaultResetArgv(),
'subsection_order': None,
'within_subsection_order': NumberOfCodeLinesSortKey,
'gallery_dirs': 'auto_examples',
'backreferences_dir': None,
'doc_module': (),
'exclude_implicit_doc': {},
'reference_url': {},
'capture_repr': ('_repr_html_', '__repr__'),
'ignore_repr_types': r'',
# Build options
# -------------
# 'plot_gallery' also accepts strings that evaluate to a bool, e.g. "True",
# "False", "1", "0" so that they can be easily set via command line
# switches of sphinx-build
'plot_gallery': 'True',
'download_all_examples': True,
'abort_on_example_error': False,
'only_warn_on_example_error': False,
'failing_examples': {},
'passing_examples': [],
'stale_examples': [], # ones that did not need to be run due to md5sum
'run_stale_examples': False,
'expected_failing_examples': set(),
'thumbnail_size': (400, 280), # Default CSS does 0.4 scaling (160, 112)
'min_reported_time': 0,
'binder': {},
'jupyterlite': {},
'promote_jupyter_magic': False,
'image_scrapers': ('matplotlib',),
'compress_images': (),
'reset_modules': ('matplotlib', 'seaborn'),
'reset_modules_order': 'before',
'first_notebook_cell': None,
'last_notebook_cell': None,
'notebook_images': False,
'pypandoc': False,
'remove_config_comments': False,
'show_memory': False,
'show_signature': True,
'junit': '',
'log_level': {'backreference_missing': 'warning'},
'inspect_global_variables': True,
'css': _KNOWN_CSS,
'matplotlib_animations': False,
'image_srcset': [],
'default_thumb_file': None,
'line_numbers': False,
'nested_sections': True,
'prefer_full_module': [],
'api_usage_ignore': '.*__.*__',
'show_api_usage': False, # if this changes, change write_api_entries, too
'copyfile_regex': '',
}
logger = sphinx.util.logging.getLogger('sphinx-gallery')
def _bool_eval(x):
if isinstance(x, str):
try:
x = eval(x)
except TypeError:
pass
return bool(x)
[docs]def parse_config(app, check_keys=True):
"""Process the Sphinx Gallery configuration."""
plot_gallery = _bool_eval(app.builder.config.plot_gallery)
src_dir = app.builder.srcdir
abort_on_example_error = _bool_eval(
app.builder.config.abort_on_example_error)
lang = app.builder.config.highlight_language
gallery_conf = _complete_gallery_conf(
app.config.sphinx_gallery_conf, src_dir, plot_gallery,
abort_on_example_error, lang, app.builder.name, app,
check_keys)
# this assures I can call the config in other places
app.config.sphinx_gallery_conf = gallery_conf
app.config.html_static_path.append(glr_path_static())
return gallery_conf
def _update_gallery_conf(gallery_conf):
"""Update gallery config.
This is separate function for better testability.
"""
# prepare regex for exclusions from implicit documentation
exclude_regex = re.compile('|'.join(gallery_conf['exclude_implicit_doc']))\
if gallery_conf['exclude_implicit_doc'] else False
gallery_conf['exclude_implicit_doc_regex'] = exclude_regex
def _complete_gallery_conf(sphinx_gallery_conf, src_dir, plot_gallery,
abort_on_example_error, lang='python',
builder_name='html', app=None, check_keys=True):
gallery_conf = copy.deepcopy(DEFAULT_GALLERY_CONF)
options = sorted(gallery_conf)
# sphinx-autoapi can run before our config filling can occur, which
# when used with show_api_usage=True can cause us to add this early.
# In theory we could bump our priority above theirs, but this could have
# unintented consequences.
ignore_keys = ('_sg_api_entries',)
extra_keys = sorted(
(set(sphinx_gallery_conf) - set(options)) - set(ignore_keys)
)
if extra_keys and check_keys:
msg = 'Unknown key(s) in sphinx_gallery_conf:\n'
for key in extra_keys:
options = get_close_matches(key, options, cutoff=0.66)
msg += repr(key)
if len(options) == 1:
msg += ', did you mean %r?' % (options[0],)
elif len(options) > 1:
msg += ', did you mean one of %r?' % (options,)
msg += '\n'
raise ConfigError(msg.strip())
gallery_conf.update(sphinx_gallery_conf)
gallery_conf.update(plot_gallery=plot_gallery)
gallery_conf.update(abort_on_example_error=abort_on_example_error)
# XXX anything that can only be a bool (rather than str) should probably be
# evaluated this way as it allows setting via -D on the command line
for key in ('promote_jupyter_magic', 'run_stale_examples',):
gallery_conf[key] = _bool_eval(gallery_conf[key])
gallery_conf['src_dir'] = src_dir
gallery_conf['app'] = app
# Check capture_repr
capture_repr = gallery_conf['capture_repr']
supported_reprs = ['__repr__', '__str__', '_repr_html_']
if isinstance(capture_repr, tuple):
for rep in capture_repr:
if rep not in supported_reprs:
raise ConfigError("All entries in 'capture_repr' must be one "
"of %s, got: %s" % (supported_reprs, rep))
else:
raise ConfigError("'capture_repr' must be a tuple, got: %s"
% (type(capture_repr),))
# Check ignore_repr_types
if not isinstance(gallery_conf['ignore_repr_types'], str):
raise ConfigError("'ignore_repr_types' must be a string, got: %s"
% (type(gallery_conf['ignore_repr_types']),))
# deal with show_memory
gallery_conf['memory_base'] = 0.
if gallery_conf['show_memory']:
if not callable(gallery_conf['show_memory']): # True-like
try:
from memory_profiler import memory_usage # noqa
except ImportError:
logger.warning("Please install 'memory_profiler' to enable "
"peak memory measurements.")
gallery_conf['show_memory'] = False
else:
def call_memory(func):
mem, out = memory_usage(func, max_usage=True, retval=True,
multiprocess=True)
try:
mem = mem[0] # old MP always returned a list
except TypeError: # 'float' object is not subscriptable
pass
return mem, out
gallery_conf['call_memory'] = call_memory
gallery_conf['memory_base'] = _get_memory_base(gallery_conf)
else:
gallery_conf['call_memory'] = gallery_conf['show_memory']
if not gallery_conf['show_memory']: # can be set to False above
def call_memory(func):
return 0., func()
gallery_conf['call_memory'] = call_memory
assert callable(gallery_conf['call_memory'])
# deal with scrapers
scrapers = gallery_conf['image_scrapers']
if not isinstance(scrapers, (tuple, list)):
scrapers = [scrapers]
scrapers = list(scrapers)
for si, scraper in enumerate(scrapers):
if isinstance(scraper, str):
if scraper in _scraper_dict:
scraper = _scraper_dict[scraper]
else:
orig_scraper = scraper
try:
scraper = import_module(scraper)
scraper = getattr(scraper, '_get_sg_image_scraper')
scraper = scraper()
except Exception as exp:
raise ConfigError('Unknown image scraper %r, got:\n%s'
% (orig_scraper, exp))
scrapers[si] = scraper
if not callable(scraper):
raise ConfigError('Scraper %r was not callable' % (scraper,))
gallery_conf['image_scrapers'] = tuple(scrapers)
del scrapers
# Here we try to set up matplotlib but don't raise an error,
# we will raise an error later when we actually try to use it
# (if we do so) in scrapers.py.
# In principle we could look to see if there is a matplotlib scraper
# in our scrapers list, but this would be backward incompatible with
# anyone using or relying on our Agg-setting behavior (e.g., for some
# custom matplotlib SVG scraper as in our docs).
# Eventually we can make this a config var like matplotlib_agg or something
# if people need us not to set it to Agg.
try:
_import_matplotlib()
except (ImportError, ValueError):
pass
# compress_images
compress_images = gallery_conf['compress_images']
if isinstance(compress_images, str):
compress_images = [compress_images]
elif not isinstance(compress_images, (tuple, list)):
raise ConfigError('compress_images must be a tuple, list, or str, '
'got %s' % (type(compress_images),))
compress_images = list(compress_images)
allowed_values = ('images', 'thumbnails')
pops = list()
for ki, kind in enumerate(compress_images):
if kind not in allowed_values:
if kind.startswith('-'):
pops.append(ki)
continue
raise ConfigError('All entries in compress_images must be one of '
'%s or a command-line switch starting with "-", '
'got %r' % (allowed_values, kind))
compress_images_args = [compress_images.pop(p) for p in pops[::-1]]
if len(compress_images) and not _has_optipng():
logger.warning(
'optipng binaries not found, PNG %s will not be optimized'
% (' and '.join(compress_images),))
compress_images = ()
gallery_conf['compress_images'] = compress_images
gallery_conf['compress_images_args'] = compress_images_args
# deal with resetters
resetters = gallery_conf['reset_modules']
if not isinstance(resetters, (tuple, list)):
resetters = [resetters]
resetters = list(resetters)
for ri, resetter in enumerate(resetters):
if isinstance(resetter, str):
if resetter not in _reset_dict:
raise ConfigError('Unknown module resetter named %r'
% (resetter,))
resetters[ri] = _reset_dict[resetter]
elif not callable(resetter):
raise ConfigError('Module resetter %r was not callable'
% (resetter,))
gallery_conf['reset_modules'] = tuple(resetters)
if not isinstance(gallery_conf['reset_modules_order'], str):
raise ConfigError('reset_modules_order must be a str, '
'got %r' % gallery_conf['reset_modules_order'])
if gallery_conf['reset_modules_order'] not in ['before', 'after', 'both']:
raise ConfigError("reset_modules_order must be in"
"['before', 'after', 'both'], "
'got %r' % gallery_conf['reset_modules_order'])
lang = lang if lang in ('python', 'python3', 'default') else 'python'
gallery_conf['lang'] = lang
del resetters
# Ensure the first cell text is a string if we have it
first_cell = gallery_conf.get("first_notebook_cell")
if (not isinstance(first_cell, str)) and (first_cell is not None):
raise ConfigError("The 'first_notebook_cell' parameter must be type "
"str or None, found type %s" % type(first_cell))
# Ensure the last cell text is a string if we have it
last_cell = gallery_conf.get("last_notebook_cell")
if (not isinstance(last_cell, str)) and (last_cell is not None):
raise ConfigError("The 'last_notebook_cell' parameter must be type str"
" or None, found type %s" % type(last_cell))
# Check pypandoc
pypandoc = gallery_conf['pypandoc']
if not isinstance(pypandoc, (dict, bool)):
raise ConfigError("'pypandoc' parameter must be of type bool or dict,"
"got: %s." % type(pypandoc))
gallery_conf['pypandoc'] = dict() if pypandoc is True else pypandoc
has_pypandoc, version = _has_pypandoc()
if isinstance(gallery_conf['pypandoc'], dict) and has_pypandoc is None:
logger.warning("'pypandoc' not available. Using Sphinx-Gallery to "
"convert rst text blocks to markdown for .ipynb files.")
gallery_conf['pypandoc'] = False
elif isinstance(gallery_conf['pypandoc'], dict):
logger.info("Using pandoc version: %s to convert rst text blocks to "
"markdown for .ipynb files" % (version,))
else:
logger.info("Using Sphinx-Gallery to convert rst text blocks to "
"markdown for .ipynb files.")
if isinstance(pypandoc, dict):
accepted_keys = ('extra_args', 'filters')
for key in pypandoc:
if key not in accepted_keys:
raise ConfigError("'pypandoc' only accepts the following key "
"values: %s, got: %s."
% (accepted_keys, key))
# Make it easy to know which builder we're in
gallery_conf['builder_name'] = builder_name
gallery_conf['titles'] = {}
# Ensure 'backreferences_dir' is str, pathlib.Path or None
backref = gallery_conf['backreferences_dir']
if (not isinstance(backref, (str, pathlib.Path))) and \
(backref is not None):
raise ConfigError("The 'backreferences_dir' parameter must be of type "
"str, pathlib.Path or None, "
"found type %s" % type(backref))
# if 'backreferences_dir' is pathlib.Path, make str for Python <=3.5
# compatibility
if isinstance(backref, pathlib.Path):
gallery_conf['backreferences_dir'] = str(backref)
# binder
gallery_conf['binder'] = check_binder_conf(gallery_conf['binder'])
# jupyterlite
print('_complete_gallery_conf', gallery_conf.get('jupyterlite'))
gallery_conf['jupyterlite'] = check_jupyterlite_conf(
gallery_conf.get('jupyterlite', {}), app)
if not isinstance(gallery_conf['css'], (list, tuple)):
raise ConfigError('gallery_conf["css"] must be list or tuple, got %r'
% (gallery_conf['css'],))
for css in gallery_conf['css']:
if css not in _KNOWN_CSS:
raise ConfigError('Unknown css %r, must be one of %r'
% (css, _KNOWN_CSS))
if gallery_conf['app'] is not None: # can be None in testing
gallery_conf['app'].add_css_file(css + '.css')
# check API usage
if not isinstance(gallery_conf['api_usage_ignore'], str):
raise ConfigError('gallery_conf["api_usage_ignore"] must be str, '
'got %s' % type(gallery_conf['api_usage_ignore']))
if not isinstance(gallery_conf['show_api_usage'], bool) and \
gallery_conf['show_api_usage'] != 'unused':
raise ConfigError(
'gallery_conf["show_api_usage"] must be True, False or "unused", '
'got %s' % gallery_conf['show_api_usage'])
_update_gallery_conf(gallery_conf)
return gallery_conf
[docs]def get_subsections(srcdir, examples_dir, gallery_conf, check_for_index=True):
"""Return the list of subsections of a gallery.
Parameters
----------
srcdir : str
absolute path to directory containing conf.py
examples_dir : str
path to the examples directory relative to conf.py
gallery_conf : dict
The gallery configuration.
check_for_index : bool
only return subfolders with a ReadMe, default True
Returns
-------
out : list
sorted list of gallery subsection folder names
"""
sortkey = gallery_conf['subsection_order']
subfolders = [subfolder for subfolder in os.listdir(examples_dir)]
if check_for_index:
subfolders = [subfolder for subfolder in subfolders
if _get_readme(os.path.join(examples_dir, subfolder),
gallery_conf, raise_error=False)
is not None]
else:
# just make sure its a directory
subfolders = [subfolder for subfolder in subfolders
if os.path.isdir(os.path.join(examples_dir, subfolder))]
base_examples_dir_path = os.path.relpath(examples_dir, srcdir)
subfolders_with_path = [os.path.join(base_examples_dir_path, item)
for item in subfolders]
sorted_subfolders = sorted(subfolders_with_path, key=sortkey)
return [subfolders[i] for i in [subfolders_with_path.index(item)
for item in sorted_subfolders]]
def _prepare_sphx_glr_dirs(gallery_conf, srcdir):
"""Creates necessary folders for sphinx_gallery files """
examples_dirs = gallery_conf['examples_dirs']
gallery_dirs = gallery_conf['gallery_dirs']
if not isinstance(examples_dirs, list):
examples_dirs = [examples_dirs]
if not isinstance(gallery_dirs, list):
gallery_dirs = [gallery_dirs]
if bool(gallery_conf['backreferences_dir']):
backreferences_dir = os.path.join(
srcdir, gallery_conf['backreferences_dir'])
if not os.path.exists(backreferences_dir):
os.makedirs(backreferences_dir)
return list(zip(examples_dirs, gallery_dirs))
def _format_toctree(items, includehidden=False):
"""Format a toc tree"""
st = """
.. toctree::
:hidden:"""
if includehidden:
st += """
:includehidden:
"""
st += """
%s\n""" % "\n ".join(items)
st += "\n"
return st
[docs]def generate_gallery_rst(app):
"""Generate the Main examples gallery reStructuredText
Start the Sphinx-Gallery configuration and recursively scan the examples
directories in order to populate the examples gallery.
We create a 2-level nested structure by iterating through every
sibling folder of the current index file.
In each of these folders, we look for a section index file,
for which we generate a toctree pointing to sibling scripts.
Then, we append the content of this section index file
to the current index file,
after we remove toctree (to keep a clean nested structure)
and sphinx tags (to prevent tag duplication)
Eventually, we create a toctree in the current index file
which points to section index files.
"""
logger.info('generating gallery...', color='white')
gallery_conf = parse_config(app)
seen_backrefs = set()
costs = []
workdirs = _prepare_sphx_glr_dirs(gallery_conf,
app.builder.srcdir)
# Check for duplicate filenames to make sure linking works as expected
examples_dirs = [ex_dir for ex_dir, _ in workdirs]
files = collect_gallery_files(examples_dirs, gallery_conf)
check_duplicate_filenames(files)
check_spaces_in_filenames(files)
for examples_dir, gallery_dir in workdirs:
examples_dir_abs_path = os.path.join(app.builder.srcdir, examples_dir)
gallery_dir_abs_path = os.path.join(app.builder.srcdir, gallery_dir)
# Create section rst files and fetch content which will
# be added to current index file. This only includes content
# from files located in the root folder of the current gallery
# (ie not in subfolders)
(
_,
this_content,
this_costs,
this_toctree_items,
) = generate_dir_rst(
examples_dir_abs_path,
gallery_dir_abs_path,
gallery_conf,
seen_backrefs,
include_toctree=False,
)
has_readme = this_content is not None
costs += this_costs
write_computation_times(gallery_conf, gallery_dir_abs_path, this_costs)
# We create an index.rst with all examples
# (this will overwrite the rst file generated by the previous call
# to generate_dir_rst)
if this_content:
# :orphan: to suppress "not included in TOCTREE" sphinx warnings
indexst = ":orphan:\n\n" + this_content
else:
# we are not going to use the index.rst.new that gets made here,
# but go through the motions to run through all the subsections...
indexst = 'Never used!'
# Write toctree with gallery items from gallery root folder
if len(this_toctree_items) > 0:
this_toctree = _format_toctree(this_toctree_items)
indexst += this_toctree
# list all paths to subsection index files in this array
subsection_index_files = []
subsecs = get_subsections(app.builder.srcdir,
examples_dir_abs_path, gallery_conf,
check_for_index=has_readme)
for subsection in subsecs:
src_dir = os.path.join(examples_dir_abs_path, subsection)
target_dir = os.path.join(gallery_dir_abs_path, subsection)
subsection_index_files.append(
'/'.join([
'', gallery_dir, subsection, 'index.rst'
]).replace(os.sep, '/') # fwd slashes needed in rst
)
(
subsection_index_path,
subsection_index_content,
subsection_costs,
subsection_toctree_filenames,
) = generate_dir_rst(
src_dir, target_dir, gallery_conf, seen_backrefs
)
if subsection_index_content:
# Filter out tags from subsection content
# to prevent tag duplication across the documentation
tag_regex = r"^\.\.(\s+)\_(.+)\:(\s*)$"
subsection_index_content = "\n".join([
line for line in subsection_index_content.splitlines()
if re.match(tag_regex, line) is None
] + [''])
indexst += subsection_index_content
has_readme_subsection = True
else:
has_readme_subsection = False
# Write subsection toctree in main file only if
# nested_sections is False or None, and
# toctree filenames were generated for the subsection.
if not gallery_conf["nested_sections"]:
if len(subsection_toctree_filenames) > 0:
subsection_index_toctree = _format_toctree(
subsection_toctree_filenames)
indexst += subsection_index_toctree
# Otherwise, a new index.rst.new file should
# have been created and it needs to be parsed
elif has_readme_subsection:
_replace_md5(subsection_index_path, mode='t')
costs += subsection_costs
write_computation_times(
gallery_conf, target_dir, subsection_costs
)
# generate toctree with subsections
if gallery_conf["nested_sections"] is True:
subsections_toctree = _format_toctree(
subsection_index_files, includehidden=True)
# add toctree to file only if there are subsections
if len(subsection_index_files) > 0:
indexst += subsections_toctree
if gallery_conf['download_all_examples']:
download_fhindex = generate_zipfiles(
gallery_dir_abs_path, app.builder.srcdir
)
indexst += download_fhindex
if (app.config.sphinx_gallery_conf['show_signature']):
indexst += SPHX_GLR_SIG
if has_readme:
index_rst_new = os.path.join(gallery_dir_abs_path, 'index.rst.new')
with codecs.open(index_rst_new, 'w', encoding='utf-8') as fhindex:
fhindex.write(indexst)
_replace_md5(index_rst_new, mode='t')
if gallery_conf['show_api_usage'] is not False:
init_api_usage(app.builder.srcdir)
_finalize_backreferences(seen_backrefs, gallery_conf)
if gallery_conf['plot_gallery']:
logger.info("computation time summary:", color='white')
lines, lens = _format_for_writing(
costs, os.path.normpath(gallery_conf['src_dir']), kind='console')
for name, t, m in lines:
text = (' - %s: ' % (name,)).ljust(lens[0] + 10)
if t is None:
text += '(not run)'
logger.info(text)
else:
t_float = float(t.split()[0])
if t_float >= gallery_conf['min_reported_time']:
text += t.rjust(lens[1]) + ' ' + m.rjust(lens[2])
logger.info(text)
# Also create a junit.xml file, useful e.g. on CircleCI
write_junit_xml(gallery_conf, app.builder.outdir, costs)
SPHX_GLR_ORPHAN = """
:orphan:
.. _{0}:
"""
SPHX_GLR_COMP_TIMES = SPHX_GLR_ORPHAN + """
Computation times
=================
"""
def _sec_to_readable(t):
"""Convert a number of seconds to a more readable representation."""
# This will only work for < 1 day execution time
# And we reserve 2 digits for minutes because presumably
# there aren't many > 99 minute scripts, but occasionally some
# > 9 minute ones
t = datetime(1, 1, 1) + timedelta(seconds=t)
t = '{0:02d}:{1:02d}.{2:03d}'.format(
t.hour * 60 + t.minute, t.second,
int(round(t.microsecond / 1000.)))
return t
[docs]def cost_name_key(cost_name):
cost, name = cost_name
# sort by descending computation time, descending memory, alphabetical name
return (-cost[0], -cost[1], name)
def _format_for_writing(costs, path, kind='rst'):
lines = list()
for cost in sorted(costs, key=cost_name_key):
if kind == 'rst': # like in sg_execution_times
name = ':ref:`sphx_glr_{0}_{1}` (``{1}``)'.format(
path, os.path.basename(cost[1]))
t = _sec_to_readable(cost[0][0])
else: # like in generate_gallery
assert kind == 'console'
name = os.path.relpath(cost[1], path)
t = '%0.2f sec' % (cost[0][0],)
m = '{0:.1f} MB'.format(cost[0][1])
lines.append([name, t, m])
lens = [max(x) for x in zip(*[[len(item) for item in cost]
for cost in lines])]
return lines, lens
[docs]def write_computation_times(gallery_conf, target_dir, costs):
total_time = sum(cost[0][0] for cost in costs)
if total_time == 0:
return
target_dir_clean = os.path.relpath(
target_dir, gallery_conf['src_dir']).replace(os.path.sep, '_')
new_ref = 'sphx_glr_%s_sg_execution_times' % target_dir_clean
with codecs.open(os.path.join(target_dir, 'sg_execution_times.rst'), 'w',
encoding='utf-8') as fid:
fid.write(SPHX_GLR_COMP_TIMES.format(new_ref))
fid.write('**{0}** total execution time for **{1}** files:\n\n'
.format(_sec_to_readable(total_time), target_dir_clean))
lines, lens = _format_for_writing(costs, target_dir_clean)
del costs
hline = ''.join(('+' + '-' * (length + 2)) for length in lens) + '+\n'
fid.write(hline)
format_str = ''.join('| {%s} ' % (ii,)
for ii in range(len(lines[0]))) + '|\n'
for line in lines:
line = [ll.ljust(len_) for ll, len_ in zip(line, lens)]
text = format_str.format(*line)
assert len(text) == len(hline)
fid.write(text)
fid.write(hline)
[docs]def write_api_entries(app, what, name, obj, options, lines):
# sphinx-autoapi can do this before we manage to complete our config
if 'show_api_usage' not in app.config.sphinx_gallery_conf:
app.config.sphinx_gallery_conf['show_api_usage'] = False
if app.config.sphinx_gallery_conf['show_api_usage'] is False:
return
if '_sg_api_entries' not in app.config.sphinx_gallery_conf:
app.config.sphinx_gallery_conf['_sg_api_entries'] = dict()
if what not in app.config.sphinx_gallery_conf['_sg_api_entries']:
app.config.sphinx_gallery_conf['_sg_api_entries'][what] = set()
app.config.sphinx_gallery_conf['_sg_api_entries'][what].add(name)
[docs]def init_api_usage(gallery_dir):
with codecs.open(os.path.join(gallery_dir, 'sg_api_usage.rst'), 'w',
encoding='utf-8'):
pass
def _make_graph(fname, entries, gallery_conf):
"""Make a graph of unused and used API entries.
The used API entries themselves are documented in the list, so
for the graph, we'll focus on the number of unused API entries
per modules. Modules with lots of unused entries (11+) will be colored
red, those with less (6+) will be colored orange, those with only a few
(1-5) will be colored yellow and those with no unused entries will be
colored blue.
The API entries that are used are shown with one graph per module.
That way you can see the examples that each API entry is used in
for that module (if this was done for the whole project at once,
the graph would get too large very large quickly).
"""
import graphviz
dg = graphviz.Digraph(filename=fname,
node_attr={'color': 'lightblue2',
'style': 'filled',
'fontsize': '40'})
if isinstance(entries, list):
connections = set()
lut = dict() # look up table for connections so they don't repeat
structs = [entry.split('.') for entry in entries]
for struct in sorted(structs, key=len):
for level in range(len(struct) - 2):
if (struct[level], struct[level + 1]) in connections:
continue
connections.add((struct[level], struct[level + 1]))
node_from = lut[struct[level]] if \
struct[level] in lut else struct[level]
dg.attr('node', color='lightblue2')
dg.node(node_from)
node_to = struct[level + 1]
# count, don't show leaves
if len(struct) - 3 == level:
leaf_count = 0
for struct2 in structs:
# find structures of the same length as struct
if len(struct2) != level + 3:
continue
# find structures with two entries before
# the leaf that are the same as struct
if all([struct2[level2] == struct[level2]
for level2 in range(level + 2)]):
leaf_count += 1
node_to += f'\n({leaf_count})'
lut[struct[level + 1]] = node_to
if leaf_count > 10:
color = 'red'
elif leaf_count > 5:
color = 'orange'
else:
color = 'yellow'
dg.attr('node', color=color)
else:
dg.attr('node', color='lightblue2')
dg.node(node_to)
dg.edge(node_from, node_to)
# add modules with all API entries
dg.attr('node', color='lightblue2')
for module in gallery_conf['_sg_api_entries']['module']:
struct = module.split('.')
for i in range(len(struct) - 1):
if struct[i + 1] not in lut:
dg.edge(struct[i], struct[i + 1])
else:
assert isinstance(entries, dict)
for entry, refs in entries.items():
dg.attr('node', color='lightblue2')
dg.node(entry)
dg.attr('node', color='yellow')
for ref in refs:
dg.node(ref)
dg.edge(entry, ref)
dg.attr(overlap='scale')
dg.save(fname)
[docs]def write_api_entry_usage(app, docname, source):
"""Write an html page describing which API entries are used and unused.
To document and graph only those API entries that are used by
autodoc, we have to wait for autodoc to finish and hook into the
``source-read`` event. This intercepts the text from the rst such
that it can be modified. Since, we only touched an empty file,
we have to add 1) a list of all the API entries that are unused
and a graph of the number of unused API entries per module and 2)
a list of API entries that are used in examples, each with a sub-list
of which examples that API entry is used in, and a graph that
connects all of the API entries in a module to the examples
that they are used in.
"""
gallery_conf = app.config.sphinx_gallery_conf
if gallery_conf['show_api_usage'] is False:
return
# since this is done at the gallery directory level (as opposed
# to in a gallery directory, e.g. auto_examples), it runs last
# which means that all the api entries will be in gallery_conf
if 'sg_api_usage' not in docname or \
'_sg_api_entries' not in gallery_conf or \
gallery_conf['backreferences_dir'] is None:
return
backreferences_dir = os.path.join(gallery_conf['src_dir'],
gallery_conf['backreferences_dir'])
example_files = set.union(
*[gallery_conf['_sg_api_entries'][obj_type]
for obj_type in ('class', 'method', 'function')
if obj_type in gallery_conf['_sg_api_entries']])
if len(example_files) == 0:
return
def get_entry_type(entry):
if entry in gallery_conf['_sg_api_entries'].get('class', []):
return 'class'
elif entry in gallery_conf['_sg_api_entries'].get('method', []):
return 'meth'
else:
assert entry in gallery_conf['_sg_api_entries']['function']
return 'func'
# find used and unused API entries
unused_api_entries = list()
used_api_entries = dict()
for entry in example_files:
# don't include built-in methods etc.
if re.match(gallery_conf['api_usage_ignore'], entry) is not None:
continue
# check if backreferences empty
example_fname = os.path.join(
backreferences_dir, f'{entry}.examples.new')
if not os.path.isfile(example_fname): # use without new
example_fname = os.path.splitext(example_fname)[0]
assert os.path.isfile(example_fname)
if os.path.getsize(example_fname) == 0:
unused_api_entries.append(entry)
else:
used_api_entries[entry] = list()
with open(example_fname, 'r', encoding='utf-8') as fid2:
for line in fid2:
if line.startswith(' :ref:'):
example_name = line.split('`')[1]
used_api_entries[entry].append(
example_name)
source[0] = SPHX_GLR_ORPHAN.format('sphx_glr_sg_api_usage')
title = 'Unused API Entries'
source[0] += title + '\n' + '^' * len(title) + '\n\n'
for entry in sorted(unused_api_entries):
source[0] += f'- :{get_entry_type(entry)}:`{entry}`\n'
source[0] += '\n\n'
has_graphviz = _has_graphviz()
if has_graphviz and unused_api_entries:
source[0] += ('.. graphviz:: ./sg_api_unused.dot\n'
' :alt: API unused entries graph\n'
' :layout: neato\n\n')
used_count = len(used_api_entries)
total_count = used_count + len(unused_api_entries)
used_percentage = used_count / max(total_count, 1) # avoid div by zero
source[0] += ('\nAPI entries used: '
f'{round(used_percentage * 100, 2)}% '
f'({used_count}/{total_count})\n\n')
if has_graphviz and unused_api_entries:
_make_graph(os.path.join(app.builder.srcdir, 'sg_api_unused.dot'),
unused_api_entries, gallery_conf)
if gallery_conf['show_api_usage'] is True and used_api_entries:
title = 'Used API Entries'
source[0] += title + '\n' + '^' * len(title) + '\n\n'
for entry in sorted(used_api_entries):
source[0] += f'- :{get_entry_type(entry)}:`{entry}`\n\n'
for ref in used_api_entries[entry]:
source[0] += f' - :ref:`{ref}`\n'
source[0] += '\n\n'
if has_graphviz:
used_modules = set([entry.split('.')[0]
for entry in used_api_entries])
for module in sorted(used_modules):
source[0] += (
f'{module}\n' + '^' * len(module) + '\n\n'
f'.. graphviz:: ./{module}_sg_api_used.dot\n'
f' :alt: {module} usage graph\n'
' :layout: neato\n\n')
for module in used_modules:
logger.info(f'Making API usage graph for {module}')
# select and format entries for this module
entries = dict()
for entry, ref in used_api_entries.items():
if entry.split('.')[0] == module:
entry = entry.replace('sphx_glr_', '')
# remove prefix
for target_dir in gallery_conf['gallery_dirs']:
if entry.startswith(target_dir):
entry = entry[len(target_dir) + 1:]
_make_graph(os.path.join(app.builder.srcdir,
f'{module}_sg_api_used.dot'),
entries, gallery_conf)
[docs]def clean_files(app, exception):
if os.path.isfile(os.path.join(app.builder.srcdir, 'sg_api_usage.rst')):
os.remove(os.path.join(app.builder.srcdir, 'sg_api_usage.rst'))
if os.path.isfile(os.path.join(app.builder.srcdir, 'sg_api_unused.dot')):
os.remove(os.path.join(app.builder.srcdir, 'sg_api_unused.dot'))
for file in os.listdir(app.builder.srcdir):
if 'sg_api_used.dot' in file:
os.remove(os.path.join(app.builder.srcdir, file))
[docs]def write_junit_xml(gallery_conf, target_dir, costs):
if not gallery_conf['junit'] or not gallery_conf['plot_gallery']:
return
failing_as_expected, failing_unexpectedly, passing_unexpectedly = \
_parse_failures(gallery_conf)
n_tests = 0
n_failures = 0
n_skips = 0
elapsed = 0.
src_dir = gallery_conf['src_dir']
output = ''
for cost in costs:
(t, _), fname = cost
if not any(fname in x for x in (gallery_conf['passing_examples'],
failing_unexpectedly,
failing_as_expected,
passing_unexpectedly)):
continue # not subselected by our regex
title = gallery_conf['titles'][fname]
output += (
u'<testcase classname={0!s} file={1!s} line="1" '
u'name={2!s} time="{3!r}">'
.format(quoteattr(os.path.splitext(os.path.basename(fname))[0]),
quoteattr(os.path.relpath(fname, src_dir)),
quoteattr(title), t))
if fname in failing_as_expected:
output += u'<skipped message="expected example failure"></skipped>'
n_skips += 1
elif fname in failing_unexpectedly or fname in passing_unexpectedly:
if fname in failing_unexpectedly:
traceback = gallery_conf['failing_examples'][fname]
else: # fname in passing_unexpectedly
traceback = 'Passed even though it was marked to fail'
n_failures += 1
output += (u'<failure message={0!s}>{1!s}</failure>'
.format(quoteattr(traceback.splitlines()[-1].strip()),
escape(traceback)))
output += u'</testcase>'
n_tests += 1
elapsed += t
output += u'</testsuite>'
output = (u'<?xml version="1.0" encoding="utf-8"?>'
u'<testsuite errors="0" failures="{0}" name="sphinx-gallery" '
u'skipped="{1}" tests="{2}" time="{3}">'
.format(n_failures, n_skips, n_tests, elapsed)) + output
# Actually write it
fname = os.path.normpath(os.path.join(target_dir, gallery_conf['junit']))
junit_dir = os.path.dirname(fname)
if not os.path.isdir(junit_dir):
os.makedirs(junit_dir)
with codecs.open(fname, 'w', encoding='utf-8') as fid:
fid.write(output)
[docs]def touch_empty_backreferences(app, what, name, obj, options, lines):
"""Generate empty back-reference example files.
This avoids inclusion errors/warnings if there are no gallery
examples for a class / module that is being parsed by autodoc"""
if not bool(app.config.sphinx_gallery_conf['backreferences_dir']):
return
examples_path = os.path.join(app.srcdir,
app.config.sphinx_gallery_conf[
"backreferences_dir"],
"%s.examples" % name)
if not os.path.exists(examples_path):
# touch file
open(examples_path, 'w').close()
def _expected_failing_examples(gallery_conf):
return set(
os.path.normpath(os.path.join(gallery_conf['src_dir'], path))
for path in gallery_conf['expected_failing_examples'])
def _parse_failures(gallery_conf):
"""Split the failures."""
failing_examples = set(gallery_conf['failing_examples'].keys())
expected_failing_examples = _expected_failing_examples(gallery_conf)
failing_as_expected = failing_examples.intersection(
expected_failing_examples)
failing_unexpectedly = failing_examples.difference(
expected_failing_examples)
passing_unexpectedly = expected_failing_examples.difference(
failing_examples)
# filter from examples actually run
passing_unexpectedly = [
src_file for src_file in passing_unexpectedly
if re.search(gallery_conf.get('filename_pattern'), src_file)]
return failing_as_expected, failing_unexpectedly, passing_unexpectedly
[docs]def summarize_failing_examples(app, exception):
"""Collects the list of falling examples and prints them with a traceback.
Raises ValueError if there where failing examples.
"""
if exception is not None:
return
# Under no-plot Examples are not run so nothing to summarize
if not app.config.sphinx_gallery_conf['plot_gallery']:
logger.info('Sphinx-Gallery gallery_conf["plot_gallery"] was '
'False, so no examples were executed.', color='brown')
return
gallery_conf = app.config.sphinx_gallery_conf
failing_as_expected, failing_unexpectedly, passing_unexpectedly = \
_parse_failures(gallery_conf)
if failing_as_expected:
logger.info("Examples failing as expected:", color='brown')
for fail_example in failing_as_expected:
logger.info('%s failed leaving traceback:', fail_example,
color='brown')
logger.info(gallery_conf['failing_examples'][fail_example],
color='brown')
fail_msgs = []
if failing_unexpectedly:
fail_msgs.append(red("Unexpected failing examples:"))
for fail_example in failing_unexpectedly:
fail_msgs.append(fail_example + ' failed leaving traceback:\n' +
gallery_conf['failing_examples'][fail_example] +
'\n')
if passing_unexpectedly:
fail_msgs.append(red("Examples expected to fail, but not failing:\n") +
"Please remove these examples from\n" +
"sphinx_gallery_conf['expected_failing_examples']\n" +
"in your conf.py file"
"\n".join(passing_unexpectedly))
# standard message
n_good = len(gallery_conf['passing_examples'])
n_tot = len(gallery_conf['failing_examples']) + n_good
n_stale = len(gallery_conf['stale_examples'])
logger.info('\nSphinx-Gallery successfully executed %d out of %d '
'file%s subselected by:\n\n'
' gallery_conf["filename_pattern"] = %r\n'
' gallery_conf["ignore_pattern"] = %r\n'
'\nafter excluding %d file%s that had previously been run '
'(based on MD5).\n'
% (n_good, n_tot, 's' if n_tot != 1 else '',
gallery_conf['filename_pattern'],
gallery_conf['ignore_pattern'],
n_stale, 's' if n_stale != 1 else '',
),
color='brown')
if fail_msgs:
fail_message = ("Here is a summary of the problems encountered "
"when running the examples\n\n" +
"\n".join(fail_msgs) + "\n" + "-" * 79)
if gallery_conf['only_warn_on_example_error']:
logger.warning(fail_message)
else:
raise ExtensionError(fail_message)
[docs]def collect_gallery_files(examples_dirs, gallery_conf):
"""Collect python files from the gallery example directories."""
files = []
for example_dir in examples_dirs:
for root, dirnames, filenames in os.walk(example_dir):
for filename in filenames:
if filename.endswith('.py'):
if re.search(gallery_conf['ignore_pattern'],
filename) is None:
files.append(os.path.join(root, filename))
return files
[docs]def check_duplicate_filenames(files):
"""Check for duplicate filenames across gallery directories."""
# Check whether we'll have duplicates
used_names = set()
dup_names = list()
for this_file in files:
this_fname = os.path.basename(this_file)
if this_fname in used_names:
dup_names.append(this_file)
else:
used_names.add(this_fname)
if len(dup_names) > 0:
logger.warning(
'Duplicate example file name(s) found. Having duplicate file '
'names will break some links. '
'List of files: {}'.format(sorted(dup_names),))
[docs]def check_spaces_in_filenames(files):
"""Check for spaces in filenames across example directories."""
regex = re.compile(r'[\s]')
files_with_space = list(filter(regex.search, files))
if files_with_space:
logger.warning(
'Example file name(s) with space(s) found. Having space(s) in '
'file names will break some links. '
'List of files: {}'.format(sorted(files_with_space),))
[docs]def get_default_config_value(key):
def default_getter(conf):
return conf['sphinx_gallery_conf'].get(key, DEFAULT_GALLERY_CONF[key])
return default_getter
[docs]def setup(app):
"""Setup Sphinx-Gallery sphinx extension"""
app.add_config_value('sphinx_gallery_conf', DEFAULT_GALLERY_CONF, 'html')
for key in ['plot_gallery', 'abort_on_example_error']:
app.add_config_value(key, get_default_config_value(key), 'html')
# set small priority value, so that pre_configure_jupyterlite_sphinx is
# called before jupyterlite_sphinx config-inited
app.connect(
'config-inited', pre_configure_jupyterlite_sphinx, priority=100)
# set high priority value, so that post_configure_jupyterlite_sphinx is
# called after jupyterlite_sphinx config-inited
app.connect(
'config-inited', post_configure_jupyterlite_sphinx, priority=900)
if 'sphinx.ext.autodoc' in app.extensions:
app.connect('autodoc-process-docstring', touch_empty_backreferences)
app.connect('autodoc-process-docstring', write_api_entries)
app.connect('source-read', write_api_entry_usage)
# Add the custom directive
app.add_directive('minigallery', MiniGallery)
app.add_directive("image-sg", ImageSg)
imagesg_addnode(app)
app.connect('builder-inited', generate_gallery_rst)
app.connect('build-finished', copy_binder_files)
app.connect('build-finished', create_jupyterlite_contents)
app.connect('build-finished', summarize_failing_examples)
app.connect('build-finished', embed_code_links)
app.connect('build-finished', clean_files)
metadata = {'parallel_read_safe': True,
'parallel_write_safe': True,
'version': _sg_version}
return metadata
[docs]def setup_module():
# HACK: Stop nosetests running setup() above
pass