Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Introduce new script that validates the signatures match between the .pyi file and the bridge #7646

Merged
merged 10 commits into from
Oct 9, 2024
Merged
3 changes: 3 additions & 0 deletions .github/workflows/reusable_test_wheels.yml
Original file line number Diff line number Diff line change
Expand Up @@ -224,3 +224,6 @@ jobs:
# --no-py-build because rerun-sdk is already built and installed
# --no-asset-download because we already downloaded the assets
run: pixi run -e wheel-test-min RUST_LOG=debug python docs/snippets/compare_snippet_output.py --target ${{ needs.set-config.outputs.TARGET }} --no-py-build --no-cpp-build --no-asset-download

- name: Check the python library signatures
run: pixi run -e wheel-test-min python scripts/ci/check_python_signatures.py
2 changes: 2 additions & 0 deletions pixi.toml
Original file line number Diff line number Diff line change
Expand Up @@ -305,6 +305,8 @@ py-build = "pixi run -e py py-build-common"
# Dedicated alias for building the python bindings in release mode for the `py` environment.
py-build-release = "pixi run -e py py-build-common-release"

check-py-signatures = "python scripts/ci/check_python_signatures.py"
jleibs marked this conversation as resolved.
Show resolved Hide resolved

# Helper alias to run the python interpreter in the context of the python environment
rrpy = "python"

Expand Down
14 changes: 7 additions & 7 deletions rerun_py/rerun_bindings/rerun_bindings.pyi
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ class IndexColumnDescriptor:
class IndexColumnSelector:
"""A selector for an index column."""

def __new__(cls, index: str): ...
def __init__(self, index: str): ...

class ComponentColumnDescriptor:
"""A column containing the component data."""
Expand All @@ -21,7 +21,7 @@ class ComponentColumnDescriptor:
class ComponentColumnSelector:
"""A selector for a component column."""

def __new__(cls, entity_path: str, component_type: ComponentLike): ...
def __init__(self, entity_path: str, component: ComponentLike): ...
def with_dictionary_encoding(self) -> ComponentColumnSelector: ...

class Schema:
Expand Down Expand Up @@ -63,7 +63,7 @@ class Recording:
"""A single recording."""

def schema(self) -> Schema: ...
def view(self, index: str, contents: ViewContentsLike) -> RecordingView: ...
def view(self, *, index: str, contents: ViewContentsLike) -> RecordingView: ...
def recording_id(self) -> str: ...
def application_id(self) -> str: ...

Expand All @@ -73,27 +73,27 @@ class RRDArchive:
def num_recordings(self) -> int: ...
def all_recordings(self) -> list[Recording]: ...

def load_recording(filename: str | os.PathLike) -> Recording:
def load_recording(path_to_rrd: str | os.PathLike) -> Recording:
"""
Load a single recording from an RRD.

Will raise a `ValueError` if the file does not contain exactly one recording.

Parameters
----------
filename : str
path_to_rrd : str
The path to the file to load.

"""
...

def load_archive(filename: str | os.PathLike) -> RRDArchive:
def load_archive(path_to_rrd: str | os.PathLike) -> RRDArchive:
"""
Load a rerun archive file from disk.

Parameters
----------
filename : str
path_to_rrd : str
The path to the file to load.

"""
Expand Down
4 changes: 3 additions & 1 deletion rerun_py/src/dataframe.rs
Original file line number Diff line number Diff line change
Expand Up @@ -67,6 +67,7 @@ struct PyIndexColumnSelector(TimeColumnSelector);
#[pymethods]
impl PyIndexColumnSelector {
#[new]
#[pyo3(text_signature = "(self, index)")]
fn new(index: &str) -> Self {
Self(TimeColumnSelector {
timeline: index.into(),
Expand Down Expand Up @@ -127,6 +128,7 @@ struct PyComponentColumnSelector(ComponentColumnSelector);
#[pymethods]
impl PyComponentColumnSelector {
#[new]
#[pyo3(text_signature = "(self, entity_path: str, component: ComponentLike)")]
fn new(entity_path: &str, component_name: ComponentLike) -> Self {
Self(ComponentColumnSelector {
entity_path: entity_path.into(),
Expand Down Expand Up @@ -196,7 +198,7 @@ impl AnyComponentColumn {
struct ComponentLike(re_sdk::ComponentName);

impl FromPyObject<'_> for ComponentLike {
fn extract(component: &PyAny) -> PyResult<Self> {
fn extract_bound(component: &Bound<'_, PyAny>) -> PyResult<Self> {
if let Ok(component_str) = component.extract::<String>() {
Ok(Self(component_str.into()))
} else if let Ok(component_str) = component
Expand Down
177 changes: 177 additions & 0 deletions scripts/ci/check_python_signatures.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,177 @@
"""
Compares the signatures in `rerun_bindings.pyi` with the actual runtime signatures in `rerun_bindings.so`.

This does not check that the type annotations match. However, it does ensure that the number of arguments,
the argument names, and whether the arguments are required or have defaults match between the stub and runtime.
"""

from __future__ import annotations

import ast
import importlib
import inspect
import sys
from inspect import Parameter, Signature
from pathlib import Path
from typing import Any

import parso
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Shouldn't this be added to the pixi.toml?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It was already in the environment, but good call. I'll make it explicit.


TotalSignature = dict[str, Signature | dict[str, Signature]]


def parse_function_signature(node: Any) -> Signature:
"""Convert a parso function definition node into a Python inspect.Signature object."""
params = []

found_star = False

for param in node.children[2].children:
if param.type == "operator":
if param.value == "*":
found_star = True
continue
param_name = param.name.value
default = Parameter.empty

if param.default:
default = ast.literal_eval(param.default.get_code())

# Determine kind of parameter (positional, keyword, etc.)
if param.star_count == 1:
kind: Any = Parameter.VAR_POSITIONAL # *args
found_star = True
elif param.star_count == 2:
kind = Parameter.VAR_KEYWORD # **kwargs
else:
if param_name == "self":
kind = Parameter.POSITIONAL_ONLY
elif found_star:
kind = Parameter.KEYWORD_ONLY
else:
kind = Parameter.POSITIONAL_OR_KEYWORD

params.append(Parameter(name=param_name, kind=kind, default=default))

return Signature(parameters=params)


def load_stub_signatures(pyi_file: Path) -> TotalSignature:
"""Use parso to parse the .pyi file and convert function and class signatures into inspect.Signature objects."""
pyi_code = Path(pyi_file).read_text()
tree = parso.parse(pyi_code)

signatures: TotalSignature = {}

for node in tree.children:
if node.type == "funcdef":
func_name = node.name.value
func_signature = parse_function_signature(node)
signatures[func_name] = func_signature

elif node.type == "classdef":
class_name = node.name.value
# Extract methods within the class
class_def = {}
for class_node in node.iter_funcdefs():
method_name = class_node.name.value

method_signature = parse_function_signature(class_node)

class_def[method_name] = method_signature

signatures[class_name] = class_def

return signatures


def load_runtime_signatures(module_name: str) -> TotalSignature:
"""Use inspect to extract runtime signatures for both functions and classes."""
module = importlib.import_module(module_name)

signatures: TotalSignature = {}

# Get top-level functions and classes
for name, obj in inspect.getmembers(module):
if inspect.isfunction(obj):
signatures[name] = inspect.signature(obj)
elif inspect.isbuiltin(obj):
signatures[name] = inspect.signature(obj)
elif inspect.isclass(obj):
class_def = {}
# Get methods within the class
for method_name, method_obj in inspect.getmembers(obj):
# Need special handling for __init__ methods because pyo3 doesn't expose them as functions
# Instead we use the __text_signature__ attribute from the class
if method_name == "__init__" and obj.__text_signature__ is not None:
sig = "def __init__" + obj.__text_signature__ + ": ..." # NOLINT
parsed = parso.parse(sig).children[0]
class_def[method_name] = parse_function_signature(parsed)
continue
try:
class_def[method_name] = inspect.signature(method_obj)
except Exception:
pass
signatures[name] = class_def

return signatures


def compare_signatures(stub_signatures: TotalSignature, runtime_signatures: TotalSignature) -> int:
"""Compare stub signatures with runtime signatures."""

result = 0

for name, stub_signature in stub_signatures.items():
if isinstance(stub_signature, dict):
if name in runtime_signatures:
runtime_class_signature = runtime_signatures.get(name)
if not isinstance(runtime_class_signature, dict):
print(f"{name} signature mismatch:")
print(f" Stub: {stub_signature}")
print(f" Runtime: {runtime_class_signature}")
result += 1
continue
for method_name, stub_method_signature in stub_signature.items():
runtime_method_signature = runtime_class_signature.get(method_name)
if runtime_method_signature != stub_method_signature:
print(f"{name}.{method_name}(…) signature mismatch:")
print(f" Stub: {stub_method_signature}")
print(f" Runtime: {runtime_method_signature}")
result += 1

else:
print(f"Class {name} not found in runtime")
result += 1
else:
if name in runtime_signatures:
# Handle top-level functions
runtime_signature = runtime_signatures.get(name)
if runtime_signature != stub_signature:
print(f"{name}(…) signature mismatch:")
print(f" Stub: {stub_signature}")
print(f" Runtime: {runtime_signature}")
result += 1
else:
print(f"Function {name} not found in runtime")
result += 1

if result == 0:
print("All stub signatures match!")

return result


def main() -> int:
# load the stub file
path_to_stub = Path(__file__).parent / ".." / ".." / "rerun_py" / "rerun_bindings" / "rerun_bindings.pyi"
jleibs marked this conversation as resolved.
Show resolved Hide resolved
stub_signatures = load_stub_signatures(path_to_stub)

# load the runtime signatures
runtime_signatures = load_runtime_signatures("rerun_bindings")

sys.exit(compare_signatures(stub_signatures, runtime_signatures))


if __name__ == "__main__":
main()
Loading