# Licensed under the Apache License: http://www.apache.org/licenses/LICENSE-2.0 # For details: https://github.com/nedbat/coveragepy/blob/master/NOTICE.txt """HTML reporting for coverage.py.""" from __future__ import annotations import collections import dataclasses import datetime import functools import json import os import re import string from dataclasses import dataclass, field from typing import Any, TYPE_CHECKING from collections.abc import Iterable import coverage from coverage.data import CoverageData, add_data_to_hash from coverage.exceptions import NoDataError from coverage.files import flat_rootname from coverage.misc import ( ensure_dir, file_be_gone, Hasher, isolate_module, format_local_datetime, human_sorted, plural, stdout_link, ) from coverage.report_core import get_analysis_to_report from coverage.results import Analysis, Numbers from coverage.templite import Templite from coverage.types import TLineNo, TMorf from coverage.version import __url__ if TYPE_CHECKING: from coverage import Coverage from coverage.plugins import FileReporter os = isolate_module(os) def data_filename(fname: str) -> str: """Return the path to an "htmlfiles" data file of ours. """ static_dir = os.path.join(os.path.dirname(__file__), "htmlfiles") static_filename = os.path.join(static_dir, fname) return static_filename def read_data(fname: str) -> str: """Return the contents of a data file of ours.""" with open(data_filename(fname)) as data_file: return data_file.read() def write_html(fname: str, html: str) -> None: """Write `html` to `fname`, properly encoded.""" html = re.sub(r"(\A\s+)|(\s+$)", "", html, flags=re.MULTILINE) + "\n" with open(fname, "wb") as fout: fout.write(html.encode("ascii", "xmlcharrefreplace")) @dataclass class LineData: """The data for each source line of HTML output.""" tokens: list[tuple[str, str]] number: TLineNo category: str contexts: list[str] contexts_label: str context_list: list[str] short_annotations: list[str] long_annotations: list[str] html: str = "" context_str: str | None = None annotate: str | None = None annotate_long: str | None = None css_class: str = "" @dataclass class FileData: """The data for each source file of HTML output.""" relative_filename: str nums: Numbers lines: list[LineData] @dataclass class IndexItem: """Information for each index entry, to render an index page.""" url: str = "" file: str = "" description: str = "" nums: Numbers = field(default_factory=Numbers) @dataclass class IndexPage: """Data for each index page.""" noun: str plural: str filename: str summaries: list[IndexItem] totals: Numbers skipped_covered_count: int skipped_empty_count: int class HtmlDataGeneration: """Generate structured data to be turned into HTML reports.""" EMPTY = "(empty)" def __init__(self, cov: Coverage) -> None: self.coverage = cov self.config = self.coverage.config self.data = self.coverage.get_data() self.has_arcs = self.data.has_arcs() if self.config.show_contexts: if self.data.measured_contexts() == {""}: self.coverage._warn("No contexts were measured") self.data.set_query_contexts(self.config.report_contexts) def data_for_file(self, fr: FileReporter, analysis: Analysis) -> FileData: """Produce the data needed for one file's report.""" if self.has_arcs: missing_branch_arcs = analysis.missing_branch_arcs() arcs_executed = analysis.arcs_executed else: missing_branch_arcs = {} arcs_executed = [] if self.config.show_contexts: contexts_by_lineno = self.data.contexts_by_lineno(analysis.filename) lines = [] branch_stats = analysis.branch_stats() for lineno, tokens in enumerate(fr.source_token_lines(), start=1): # Figure out how to mark this line. category = "" short_annotations = [] long_annotations = [] if lineno in analysis.excluded: category = "exc" elif lineno in analysis.missing: category = "mis" elif self.has_arcs and lineno in missing_branch_arcs: category = "par" mba = missing_branch_arcs[lineno] if len(mba) == branch_stats[lineno][0]: # None of the branches were taken from this line. short_annotations.append("anywhere") long_annotations.append( f"line {lineno} didn't jump anywhere: it always raised an exception." ) else: for b in missing_branch_arcs[lineno]: if b < 0: short_annotations.append("exit") else: short_annotations.append(str(b)) long_annotations.append( fr.missing_arc_description(lineno, b, arcs_executed) ) elif lineno in analysis.statements: category = "run" contexts = [] contexts_label = "" context_list = [] if category and self.config.show_contexts: contexts = human_sorted(c or self.EMPTY for c in contexts_by_lineno.get(lineno, ())) if contexts == [self.EMPTY]: contexts_label = self.EMPTY else: contexts_label = f"{len(contexts)} ctx" context_list = contexts lines.append(LineData( tokens=tokens, number=lineno, category=category, contexts=contexts, contexts_label=contexts_label, context_list=context_list, short_annotations=short_annotations, long_annotations=long_annotations, )) file_data = FileData( relative_filename=fr.relative_filename(), nums=analysis.numbers, lines=lines, ) return file_data class FileToReport: """A file we're considering reporting.""" def __init__(self, fr: FileReporter, analysis: Analysis) -> None: self.fr = fr self.analysis = analysis self.rootname = flat_rootname(fr.relative_filename()) self.html_filename = self.rootname + ".html" self.prev_html = self.next_html = "" HTML_SAFE = string.ascii_letters + string.digits + "!#$%'()*+,-./:;=?@[]^_`{|}~" @functools.cache def encode_int(n: int) -> str: """Create a short HTML-safe string from an integer, using HTML_SAFE.""" if n == 0: return HTML_SAFE[0] r = [] while n: n, t = divmod(n, len(HTML_SAFE)) r.append(HTML_SAFE[t]) return "".join(r) def copy_with_cache_bust(src: str, dest_dir: str) -> str: """Copy `src` to `dest_dir`, adding a hash to the name. Returns the updated destination file name with hash. """ with open(src, "rb") as f: text = f.read() h = Hasher() h.update(text) cache_bust = h.hexdigest()[:8] src_base = os.path.basename(src) dest = src_base.replace(".", f"_cb_{cache_bust}.") with open(os.path.join(dest_dir, dest), "wb") as f: f.write(text) return dest class HtmlReporter: """HTML reporting.""" # These files will be copied from the htmlfiles directory to the output # directory. STATIC_FILES = [ "style.css", "coverage_html.js", "keybd_closed.png", "favicon_32.png", ] def __init__(self, cov: Coverage) -> None: self.coverage = cov self.config = self.coverage.config self.directory = self.config.html_dir self.skip_covered = self.config.html_skip_covered if self.skip_covered is None: self.skip_covered = self.config.skip_covered self.skip_empty = self.config.html_skip_empty if self.skip_empty is None: self.skip_empty = self.config.skip_empty title = self.config.html_title self.extra_css = bool(self.config.extra_css) self.data = self.coverage.get_data() self.has_arcs = self.data.has_arcs() self.index_pages: dict[str, IndexPage] = { "file": self.new_index_page("file", "files"), } self.incr = IncrementalChecker(self.directory) self.datagen = HtmlDataGeneration(self.coverage) self.directory_was_empty = False self.first_fr = None self.final_fr = None self.template_globals = { # Functions available in the templates. "escape": escape, "pair": pair, "len": len, # Constants for this report. "__url__": __url__, "__version__": coverage.__version__, "title": title, "time_stamp": format_local_datetime(datetime.datetime.now()), "extra_css": self.extra_css, "has_arcs": self.has_arcs, "show_contexts": self.config.show_contexts, "statics": {}, # Constants for all reports. # These css classes determine which lines are highlighted by default. "category": { "exc": "exc show_exc", "mis": "mis show_mis", "par": "par run show_par", "run": "run", }, } self.index_tmpl = Templite(read_data("index.html"), self.template_globals) self.pyfile_html_source = read_data("pyfile.html") self.source_tmpl = Templite(self.pyfile_html_source, self.template_globals) def new_index_page(self, noun: str, plural_noun: str) -> IndexPage: """Create an IndexPage for a kind of region.""" return IndexPage( noun=noun, plural=plural_noun, filename="index.html" if noun == "file" else f"{noun}_index.html", summaries=[], totals=Numbers(precision=self.config.precision), skipped_covered_count=0, skipped_empty_count=0, ) def report(self, morfs: Iterable[TMorf] | None) -> float: """Generate an HTML report for `morfs`. `morfs` is a list of modules or file names. """ # Read the status data and check that this run used the same # global data as the last run. self.incr.read() self.incr.check_global_data(self.config, self.pyfile_html_source) # Process all the files. For each page we need to supply a link # to the next and previous page. files_to_report = [] have_data = False for fr, analysis in get_analysis_to_report(self.coverage, morfs): have_data = True ftr = FileToReport(fr, analysis) if self.should_report(analysis, self.index_pages["file"]): files_to_report.append(ftr) else: file_be_gone(os.path.join(self.directory, ftr.html_filename)) if not have_data: raise NoDataError("No data to report.") self.make_directory() self.make_local_static_report_files() if files_to_report: for ftr1, ftr2 in zip(files_to_report[:-1], files_to_report[1:]): ftr1.next_html = ftr2.html_filename ftr2.prev_html = ftr1.html_filename files_to_report[0].prev_html = "index.html" files_to_report[-1].next_html = "index.html" for ftr in files_to_report: self.write_html_page(ftr) for noun, plural_noun in ftr.fr.code_region_kinds(): if noun not in self.index_pages: self.index_pages[noun] = self.new_index_page(noun, plural_noun) # Write the index page. if files_to_report: first_html = files_to_report[0].html_filename final_html = files_to_report[-1].html_filename else: first_html = final_html = "index.html" self.write_file_index_page(first_html, final_html) # Write function and class index pages. self.write_region_index_pages(files_to_report) return ( self.index_pages["file"].totals.n_statements and self.index_pages["file"].totals.pc_covered ) def make_directory(self) -> None: """Make sure our htmlcov directory exists.""" ensure_dir(self.directory) if not os.listdir(self.directory): self.directory_was_empty = True def copy_static_file(self, src: str, slug: str = "") -> None: """Copy a static file into the output directory with cache busting.""" dest = copy_with_cache_bust(src, self.directory) if not slug: slug = os.path.basename(src).replace(".", "_") self.template_globals["statics"][slug] = dest # type: ignore def make_local_static_report_files(self) -> None: """Make local instances of static files for HTML report.""" # The files we provide must always be copied. for static in self.STATIC_FILES: self.copy_static_file(data_filename(static)) # The user may have extra CSS they want copied. if self.extra_css: assert self.config.extra_css is not None self.copy_static_file(self.config.extra_css, slug="extra_css") # Only write the .gitignore file if the directory was originally empty. # .gitignore can't be copied from the source tree because if it was in # the source tree, it would stop the static files from being checked in. if self.directory_was_empty: with open(os.path.join(self.directory, ".gitignore"), "w") as fgi: fgi.write("# Created by coverage.py\n*\n") def should_report(self, analysis: Analysis, index_page: IndexPage) -> bool: """Determine if we'll report this file or region.""" # Get the numbers for this file. nums = analysis.numbers index_page.totals += nums if self.skip_covered: # Don't report on 100% files. no_missing_lines = (nums.n_missing == 0) no_missing_branches = (nums.n_partial_branches == 0) if no_missing_lines and no_missing_branches: index_page.skipped_covered_count += 1 return False if self.skip_empty: # Don't report on empty files. if nums.n_statements == 0: index_page.skipped_empty_count += 1 return False return True def write_html_page(self, ftr: FileToReport) -> None: """Generate an HTML page for one source file. If the page on disk is already correct based on our incremental status checking, then the page doesn't have to be generated, and this function only does page summary bookkeeping. """ # Find out if the page on disk is already correct. if self.incr.can_skip_file(self.data, ftr.fr, ftr.rootname): self.index_pages["file"].summaries.append(self.incr.index_info(ftr.rootname)) return # Write the HTML page for this source file. file_data = self.datagen.data_for_file(ftr.fr, ftr.analysis) contexts = collections.Counter(c for cline in file_data.lines for c in cline.contexts) context_codes = {y: i for (i, y) in enumerate(x[0] for x in contexts.most_common())} if context_codes: contexts_json = json.dumps( {encode_int(v): k for (k, v) in context_codes.items()}, indent=2, ) else: contexts_json = None for ldata in file_data.lines: # Build the HTML for the line. html_parts = [] for tok_type, tok_text in ldata.tokens: if tok_type == "ws": html_parts.append(escape(tok_text)) else: tok_html = escape(tok_text) or " " html_parts.append(f'{tok_html}') ldata.html = "".join(html_parts) if ldata.context_list: encoded_contexts = [ encode_int(context_codes[c_context]) for c_context in ldata.context_list ] code_width = max(len(ec) for ec in encoded_contexts) ldata.context_str = ( str(code_width) + "".join(ec.ljust(code_width) for ec in encoded_contexts) ) else: ldata.context_str = "" if ldata.short_annotations: # 202F is NARROW NO-BREAK SPACE. # 219B is RIGHTWARDS ARROW WITH STROKE. ldata.annotate = ",   ".join( f"{ldata.number} ↛ {d}" for d in ldata.short_annotations ) else: ldata.annotate = None if ldata.long_annotations: longs = ldata.long_annotations # A line can only have two branch destinations. If there were # two missing, we would have written one as "always raised." assert len(longs) == 1, ( f"Had long annotations in {ftr.fr.relative_filename()}: {longs}" ) ldata.annotate_long = longs[0] else: ldata.annotate_long = None css_classes = [] if ldata.category: css_classes.append( self.template_globals["category"][ldata.category], # type: ignore[index] ) ldata.css_class = " ".join(css_classes) or "pln" html_path = os.path.join(self.directory, ftr.html_filename) html = self.source_tmpl.render({ **file_data.__dict__, "contexts_json": contexts_json, "prev_html": ftr.prev_html, "next_html": ftr.next_html, }) write_html(html_path, html) # Save this file's information for the index page. index_info = IndexItem( url = ftr.html_filename, file = escape(ftr.fr.relative_filename()), nums = ftr.analysis.numbers, ) self.index_pages["file"].summaries.append(index_info) self.incr.set_index_info(ftr.rootname, index_info) def write_file_index_page(self, first_html: str, final_html: str) -> None: """Write the file index page for this report.""" index_file = self.write_index_page( self.index_pages["file"], first_html=first_html, final_html=final_html, ) print_href = stdout_link(index_file, f"file://{os.path.abspath(index_file)}") self.coverage._message(f"Wrote HTML report to {print_href}") # Write the latest hashes for next time. self.incr.write() def write_region_index_pages(self, files_to_report: Iterable[FileToReport]) -> None: """Write the other index pages for this report.""" for ftr in files_to_report: region_nouns = [pair[0] for pair in ftr.fr.code_region_kinds()] num_lines = len(ftr.fr.source().splitlines()) regions = ftr.fr.code_regions() for noun in region_nouns: page_data = self.index_pages[noun] outside_lines = set(range(1, num_lines + 1)) for region in regions: if region.kind != noun: continue outside_lines -= region.lines analysis = ftr.analysis.narrow(region.lines) if not self.should_report(analysis, page_data): continue sorting_name = region.name.rpartition(".")[-1].lstrip("_") page_data.summaries.append(IndexItem( url=f"{ftr.html_filename}#t{region.start}", file=escape(ftr.fr.relative_filename()), description=( f"" + escape(region.name) + "" ), nums=analysis.numbers, )) analysis = ftr.analysis.narrow(outside_lines) if self.should_report(analysis, page_data): page_data.summaries.append(IndexItem( url=ftr.html_filename, file=escape(ftr.fr.relative_filename()), description=( "" + f"(no {escape(noun)})" + "" ), nums=analysis.numbers, )) for noun, index_page in self.index_pages.items(): if noun != "file": self.write_index_page(index_page) def write_index_page(self, index_page: IndexPage, **kwargs: str) -> str: """Write an index page specified by `index_page`. Returns the filename created. """ skipped_covered_msg = skipped_empty_msg = "" if n := index_page.skipped_covered_count: word = plural(n, index_page.noun, index_page.plural) skipped_covered_msg = f"{n} {word} skipped due to complete coverage." if n := index_page.skipped_empty_count: word = plural(n, index_page.noun, index_page.plural) skipped_empty_msg = f"{n} empty {word} skipped." index_buttons = [ { "label": ip.plural.title(), "url": ip.filename if ip.noun != index_page.noun else "", "current": ip.noun == index_page.noun, } for ip in self.index_pages.values() ] render_data = { "regions": index_page.summaries, "totals": index_page.totals, "noun": index_page.noun, "region_noun": index_page.noun if index_page.noun != "file" else "", "skip_covered": self.skip_covered, "skipped_covered_msg": skipped_covered_msg, "skipped_empty_msg": skipped_empty_msg, "first_html": "", "final_html": "", "index_buttons": index_buttons, } render_data.update(kwargs) html = self.index_tmpl.render(render_data) index_file = os.path.join(self.directory, index_page.filename) write_html(index_file, html) return index_file @dataclass class FileInfo: """Summary of the information from last rendering, to avoid duplicate work.""" hash: str = "" index: IndexItem = field(default_factory=IndexItem) class IncrementalChecker: """Logic and data to support incremental reporting. When generating an HTML report, often only a few of the source files have changed since the last time we made the HTML report. This means previously created HTML pages can be reused without generating them again, speeding the command. This class manages a JSON data file that captures enough information to know whether an HTML page for a .py file needs to be regenerated or not. The data file also needs to store all the information needed to create the entry for the file on the index page so that if the HTML page is reused, the index page can still be created to refer to it. The data looks like:: { "note": "This file is an internal implementation detail ...", // A fixed number indicating the data format. STATUS_FORMAT "format": 5, // The version of coverage.py "version": "7.4.4", // A hash of a number of global things, including the configuration // settings and the pyfile.html template itself. "globals": "540ee119c15d52a68a53fe6f0897346d", "files": { // An entry for each source file keyed by the flat_rootname(). "z_7b071bdc2a35fa80___init___py": { // Hash of the source, the text of the .py file. "hash": "e45581a5b48f879f301c0f30bf77a50c", // Information for the index.html file. "index": { "url": "z_7b071bdc2a35fa80___init___py.html", "file": "cogapp/__init__.py", "description": "", // The Numbers for this file. "nums": { "precision": 2, "n_files": 1, "n_statements": 43, ... } } }, ... } } """ STATUS_FILE = "status.json" STATUS_FORMAT = 5 NOTE = ( "This file is an internal implementation detail to speed up HTML report" + " generation. Its format can change at any time. You might be looking" + " for the JSON report: https://coverage.rtfd.io/cmd.html#cmd-json" ) def __init__(self, directory: str) -> None: self.directory = directory self._reset() def _reset(self) -> None: """Initialize to empty. Causes all files to be reported.""" self.globals = "" self.files: dict[str, FileInfo] = {} def read(self) -> None: """Read the information we stored last time.""" try: status_file = os.path.join(self.directory, self.STATUS_FILE) with open(status_file) as fstatus: status = json.load(fstatus) except (OSError, ValueError): # Status file is missing or malformed. usable = False else: if status["format"] != self.STATUS_FORMAT: usable = False elif status["version"] != coverage.__version__: usable = False else: usable = True if usable: self.files = {} for filename, filedict in status["files"].items(): indexdict = filedict["index"] index_item = IndexItem(**indexdict) index_item.nums = Numbers(**indexdict["nums"]) fileinfo = FileInfo( hash=filedict["hash"], index=index_item, ) self.files[filename] = fileinfo self.globals = status["globals"] else: self._reset() def write(self) -> None: """Write the current status.""" status_file = os.path.join(self.directory, self.STATUS_FILE) status_data = { "note": self.NOTE, "format": self.STATUS_FORMAT, "version": coverage.__version__, "globals": self.globals, "files": { fname: dataclasses.asdict(finfo) for fname, finfo in self.files.items() }, } with open(status_file, "w") as fout: json.dump(status_data, fout, separators=(",", ":")) def check_global_data(self, *data: Any) -> None: """Check the global data that can affect incremental reporting. Pass in whatever global information could affect the content of the HTML pages. If the global data has changed since last time, this will clear the data so that all files are regenerated. """ m = Hasher() for d in data: m.update(d) these_globals = m.hexdigest() if self.globals != these_globals: self._reset() self.globals = these_globals def can_skip_file(self, data: CoverageData, fr: FileReporter, rootname: str) -> bool: """Can we skip reporting this file? `data` is a CoverageData object, `fr` is a `FileReporter`, and `rootname` is the name being used for the file. Returns True if the HTML page is fine as-is, False if we need to recreate the HTML page. """ m = Hasher() m.update(fr.source().encode("utf-8")) add_data_to_hash(data, fr.filename, m) this_hash = m.hexdigest() file_info = self.files.setdefault(rootname, FileInfo()) if this_hash == file_info.hash: # Nothing has changed to require the file to be reported again. return True else: # File has changed, record the latest hash and force regeneration. file_info.hash = this_hash return False def index_info(self, fname: str) -> IndexItem: """Get the information for index.html for `fname`.""" return self.files.get(fname, FileInfo()).index def set_index_info(self, fname: str, info: IndexItem) -> None: """Set the information for index.html for `fname`.""" self.files.setdefault(fname, FileInfo()).index = info # Helpers for templates and generating HTML def escape(t: str) -> str: """HTML-escape the text in `t`. This is only suitable for HTML text, not attributes. """ # Convert HTML special chars into HTML entities. return t.replace("&", "&").replace("<", "<") def pair(ratio: tuple[int, int]) -> str: """Format a pair of numbers so JavaScript can read them in an attribute.""" return "{} {}".format(*ratio)