Skip to content

Commit

Permalink
test: Add code to test the documentation examples
Browse files Browse the repository at this point in the history
This code has been subject to considerable work to get it into this
form. However, it did not seem useful to retain the various approaches
and versions of the code before this state.

A quick guide to this code:

* It finds any Markdown files in `docs/`.
* It uses the SuperFences extension, as we do in the MkDocs
  configuration, to extract Markdown code blocks labelled with `ehrql`
  syntax. These are assumed to be self-contained dataset definitions.
* The code blocks that will be tested should appear as code blocks in
  the documentation, by default (provided the CSS isn't changed to
  modify the appearance of code blocks somehow, which shouldn't be the
  case, because why would you?). They are identified in the parametrized
  tests by their ordinal fence number in the source file.
* It finds any Python modules indicated by a `.py` extension. Python
  modules are assumed to be self-contained dataset definitions.
* The found dataset definitions are run to generate a dataset, and the
  output checked to see if it's a CSV.

There is some monkeypatching necessary to make this work:

* `codelist_from_csv()` relies on having CSV data available, and the
  checks on valid codelist codes are patched out.  Without further work,
  we don't have any direct way of including data for inline dataset
  definitions in Markdown source, or specifying which mock CSV data to
  use without any established convention for examples to use.  #1697
  proposes ideas to remove this monkeypatching further.
* The sandboxing code is monkeypatched out to use "unsafe" loading of
  dataset definitions. Without doing so, it is not possible to
  monkeypatch any other ehrQL code: the ehrQL is run in a subprocess
  otherwise.

For more details and discussion, see the related PR for this code
(#1648) and the previous PR (#1475) which this approach replaces.
  • Loading branch information
StevenMaude committed Nov 2, 2023
1 parent 3fd3da5 commit 6cbf16b
Show file tree
Hide file tree
Showing 2 changed files with 293 additions and 0 deletions.
Empty file added tests/docs/__init__.py
Empty file.
293 changes: 293 additions & 0 deletions tests/docs/test_complete_examples.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,293 @@
import csv
import inspect
import typing
import unittest.mock
import uuid
from collections.abc import Generator, Iterator
from dataclasses import dataclass
from pathlib import Path

import markdown
import mkdocs.config
import pytest

import ehrql.main


@dataclass
class MarkdownFence:
"""Represents a Markdown fence."""

source: str
language: str


class MarkdownFenceExtractor:
"""Extracts fences from a markdown.Markdown object using the SuperFences extension.
See https://facelessuser.github.io/pymdown-extensions/extensions/superfences/
"""

def __init__(self, content: str) -> None:
self.fences: list[MarkdownFence] = []
self.extension_configs: typing.Mapping[
str, typing.Any
] = self._configure_superfences()
self._extract_fences(content)

def _fence_null_format(
# Argument types are taken from mkdocs-code-validator,
# which has an MIT license,
# but they will be removed before merge.
self,
src: str,
language: str,
css_class: str | None,
options: typing.Mapping[str, typing.Any],
md: markdown.Markdown,
**kwargs,
) -> str:
"""Extract the fences in the same way
as the SuperFences extension does, and make them accessible to the test code.
Returns an empty string.
This null formatter exists only for this purpose.
See https://facelessuser.github.io/pymdown-extensions/extensions/superfences/#formatters
"All formatters should return a string as HTML."
We don't require the formatted text,
only that this method is run and we can access the source
and language."""
self.fences.append(MarkdownFence(source=src, language=language))
return ""

def _configure_superfences(self):
"""Retrieves the existing extensions settings from the mkdocs.yml
configuration, replacing any custom SuperFences fences with a special
test custom fence to extract all fences."""
config_path = Path(__file__).parents[2] / "mkdocs.yml"
config = mkdocs.config.load_config(config_file_path=str(config_path))
assert "pymdownx.superfences" in config["markdown_extensions"]
config["mdx_configs"]["pymdownx.superfences"]["custom_fences"] = [
{
# "name" specifies fences to extract.
"name": "*",
"class": "test",
"format": self._fence_null_format,
},
]
return config["mdx_configs"]

def _extract_fences(self, content: str) -> None:
markdown.Markdown(
extensions=["pymdownx.superfences"],
extension_configs=self.extension_configs,
).convert(content)


@dataclass
class DatasetDefinitionExample:
"""Stores details of a complete ehrQL dataset definition example.
The origin of such an example may be a Markdown fence,
or a standalone Python module."""

path: Path
# This fence number count includes all fences,
# not just the ehrQL fences.
# Standalone Python modules are not given a fence number.
fence_number: int | None
source: str

def relative_path(self) -> Path:
"""Return the relative path of the dataset definition source file
to the source code root."""
source_code_path = Path(__file__).parents[2]
return self.path.relative_to(source_code_path)


def discover_paths(glob_string: str) -> Generator[Path, None, None]:
"""Generate a list of matching files for a glob in the documentation source path."""
docs_path = Path(__file__).parents[2] / "docs"
return docs_path.glob(glob_string)


def find_complete_ehrql_examples_in_markdown(
file: typing.TextIO,
) -> Iterator[DatasetDefinitionExample]:
"""Yields extracted code blocks labelled as ```ehrql from a Markdown file.
Incomplete ehrQL dataset definitions should be labelled as ```python,
and not with ```ehrql."""
f = MarkdownFenceExtractor(file.read())

for fence_number, fence in enumerate(f.fences, start=1):
if fence.language == "ehrql":
example = DatasetDefinitionExample(
path=Path(file.name),
source=fence.source,
fence_number=fence_number,
)
yield example


def generate_complete_ehrql_examples() -> (
Generator[DatasetDefinitionExample, None, None]
):
"""Yields all complete ehrQL DatasetDefinitionExamples from the Markdown documentation."""
markdown_paths = list(discover_paths("**/*.md"))
assert len(markdown_paths) > 0, "No Markdown files found"

for p in markdown_paths:
with open(p) as f:
yield from find_complete_ehrql_examples_in_markdown(f)

dataset_definition_source_paths = list(discover_paths("**/*.py"))
assert len(dataset_definition_source_paths) > 0, "No .py files found"

for p in dataset_definition_source_paths:
with open(p) as f:
content = f.read()
assert len(content) > 0
yield DatasetDefinitionExample(
path=Path(f.name),
fence_number=None,
source=content,
)


def create_example_test_case_id(example: DatasetDefinitionExample) -> str:
"""Returns a test case ID for pytest from a specific DatasetDefinitionExample."""
test_id = f"{example.relative_path()}"
if example.fence_number is not None:
test_id += f"; fence {example.fence_number}"
return test_id


def validate_dataset_output(dataset_path: Path) -> None:
"""Validates that an output dataset file is a CSV."""
with open(dataset_path) as f:
csv_content = f.readlines()

# If the dataset definition works, we should have a valid CSV.
assert len(csv_content) > 0, "CSV is empty for dataset"

# Check we can read the CSV content.
csv_reader = csv.DictReader(csv_content)
for row in csv_reader:
pass


class DatasetDefinitionTestError(Exception):
pass


@pytest.mark.parametrize(
"example",
generate_complete_ehrql_examples(),
ids=create_example_test_case_id,
)
def test_ehrql_generate_dataset_example(
tmp_path: Path, example: DatasetDefinitionExample
) -> None:
tmp_filename_base = str(uuid.uuid4())

tmp_dataset_definition_path = tmp_path / (tmp_filename_base + ".py")
tmp_dataset_definition_path.write_text(example.source)

tmp_dataset_path = tmp_path / (tmp_filename_base + ".csv")

code_column_name = "code"
category_column_name = "category"
tmp_codelist_path = tmp_path / (tmp_filename_base + "_codelist.csv")
tmp_codelist_path.write_text(
f"{code_column_name},{category_column_name}\n"
"not_a_real_code!,not_a_real_category!"
)

codelist_fn = ehrql.codelist_from_csv

def wrapped_codelist_from_csv(*args, **kwargs):
"""Returns the result from ehrql.codelist_from_csv.
This is used to monkeypatch the real ehrql.codelist_from_csv
so that we can use a mock CSV, but it:
* validates the function arguments
* calls the real function with the mock CSV data
Different documentation examples may refer to different CSV columns.
Because of this, we change the arguments passed to codelist_from_csv().
"""
codelist_fn_signature = inspect.signature(codelist_fn)
try:
codelist_fn_signature.bind(*args, **kwargs)
except TypeError as e:
e.add_note("codelist_from_csv() given incorrect arguments")
raise e

return codelist_fn(
filename=tmp_codelist_path,
column=code_column_name,
category_column=category_column_name,
)

def wrapped_load_dataset_definition(definition_file, user_args, _):
"""Wraps ehrql.load_dataset_definition to use the unsafe version
that runs the dataset definition in the same process,
without sandboxing.
This is to remove the additional environ argument that is not used in
load_dataset_definition_unsafe."""
return ehrql.loaders.load_dataset_definition_unsafe(definition_file, user_args)

formatted_example = f"\nEXAMPLE FILENAME {example.path}\nEXAMPLE START\n{example.source}\nEXAMPLE END"

with (
# Patch out the sandbox for now to use the unsafe loader.
# This allows the subsequent monkeypatching of codelist_from_csv.
# By patching load_dataset_definition,
# we can still use the existing ehrql.main.generate_dataset function.
unittest.mock.patch(
"ehrql.main.load_dataset_definition",
wraps=wrapped_load_dataset_definition,
),
unittest.mock.patch(
"ehrql.codelist_from_csv",
wraps=wrapped_codelist_from_csv,
),
# There is no codelist code that satisfies constraints of all code systems,
# so patch out the validity check and just pass in a fake codelist.
unittest.mock.patch(
"ehrql.codes.BaseCode.__post_init__",
return_value=None,
),
):
try:
# No name needed to store a value:
# the output CSV gets written to a temporary file.
ehrql.main.generate_dataset(
tmp_dataset_definition_path,
tmp_dataset_path,
dsn=None,
backend_class=None,
query_engine_class=None,
dummy_tables_path=None,
dummy_data_file=None,
environ={},
user_args=(),
)
except Exception as e:
raise DatasetDefinitionTestError(
f"generate_dataset failed for example: {formatted_example}"
) from e

try:
validate_dataset_output(tmp_dataset_path)
except Exception:
raise DatasetDefinitionTestError(
f"Check of output dataset CSV failed for example: \n{formatted_example}"
)
raise

0 comments on commit 6cbf16b

Please sign in to comment.