Skip to content

Commit

Permalink
Add diff_definitions.py
Browse files Browse the repository at this point in the history
This new script makes it easy to compare the current definitions
of events and other types against a chosen base, e.g. the current
state of the master branch or a previous edition. It produces diff
commands that can be run to produce the wanted comparison.

Since figuring out the most recent version of each type is a pretty
common operation, a new versions module is introduced for this purpose.
The existing find-latest-schemas.py script has been adapted to use the
new module.
  • Loading branch information
magnusbaeck committed Jan 7, 2024
1 parent d09c69f commit 2c28aa3
Show file tree
Hide file tree
Showing 4 changed files with 232 additions and 22 deletions.
61 changes: 61 additions & 0 deletions diff_definitions.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,61 @@
#!/usr/bin/env python3

# Copyright 2024 Axis Communications AB.
# For a full list of individual contributors, please see the commit history.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Context-sensitive diffing of Eiffel type definitions. Compares the
currently available types with the ones from a specified base and
prints diff commands. For example, if the current commit has added
v4.3.0 of ActT you'll get the following output:
diff -u definitions/EiffelActivityTriggeredEvent/4.2.0.yml definitions/EiffelActivityTriggeredEvent/4.3.0.yml
diff -u schemas/EiffelActivityTriggeredEvent/4.2.0.json schemas/EiffelActivityTriggeredEvent/4.3.0.json
By default, the base of the comparison is origin/master, but any commit
reference can be given as an argument.
"""

import sys
from pathlib import Path

import versions


def _main():
base = "origin/master"
if len(sys.argv) > 2:
print(f"Usage: python {sys.argv[0]} [ base ]")
sys.exit(-1)
elif len(sys.argv) == 2:
base = sys.argv[1]

earlier = versions.latest_in_gitref(base, ".", Path("definitions"))
current = versions.latest_in_dir(Path("definitions"))
for type, current_version in sorted(current.items()):
earlier_version = earlier.get(type)
if not earlier_version:
print(f"diff -u /dev/null definitions/{type}/{current_version}.yml")
print(f"diff -u /dev/null schemas/{type}/{current_version}.json")
elif earlier_version != current_version:
print(
f"diff -u definitions/{type}/{earlier_version}.yml definitions/{type}/{current_version}.yml"
)
print(
f"diff -u schemas/{type}/{earlier_version}.json schemas/{type}/{current_version}.json"
)


if __name__ == "__main__":
_main()
35 changes: 13 additions & 22 deletions find-latest-schemas.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
import os
import sys
from pathlib import Path
from shutil import copyfile

import semver
import versions

"""
Finds the latest versions of schemas found under <input_folder>, with
Expand All @@ -16,28 +16,19 @@

def main():
if len(sys.argv) != 3:
print("Usage: python {} input_folder output_folder".format(sys.argv[0]))
print(f"Usage: python {sys.argv[0]} input_folder output_folder")
sys.exit(-1)

input_folder = sys.argv[1]
output_folder = sys.argv[2]

if not os.path.exists(output_folder):
os.makedirs(output_folder)

latest_versions = []
for base, _, files in os.walk(input_folder):
if len(files) != 0:
latest_version = "0.0.0"
for f in files:
latest_version = semver.max_ver(latest_version, os.path.splitext(f)[0])
latest_versions.append(os.path.join(base, latest_version + ".json"))

for f in latest_versions:
new_name = os.path.split(os.path.dirname(f))[1] + ".json"
output_file = os.path.join(output_folder, new_name)
copyfile(f, output_file)
print("{} => {}".format(f, output_file))
input_folder = Path(sys.argv[1])
output_folder = Path(sys.argv[2])

output_folder.mkdir(exist_ok=True)

for type, version in versions.latest_in_dir(input_folder).items():
input_file = input_folder / type / f"{version}.json"
output_file = output_folder / f"{type}.json"
copyfile(input_file, output_file)
print(f"{input_file} => {output_file}")


if __name__ == "__main__":
Expand Down
90 changes: 90 additions & 0 deletions test_versions.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,90 @@
# Copyright 2024 Axis Communications AB.
# For a full list of individual contributors, please see the commit history.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import subprocess
from pathlib import Path

import pytest
import semver

import versions


class Git:
"""Simple class for running Git commands in a given directory."""

def __init__(self, path: Path):
self.path = path
self.command("init")

def command(self, *args: str) -> None:
subprocess.check_call(["git"] + list(args), cwd=self.path)


@pytest.fixture
def tmp_git(tmp_path):
"""Injects a Git instance rooted in a temporary directory."""
yield Git(tmp_path)


def create_files(base_path: Path, *args: str) -> None:
for p in args:
fullpath = base_path / p
fullpath.parent.mkdir(parents=True, exist_ok=True)
fullpath.touch()


def test_latest_in_gitref(tmp_git):
# Create a bunch of files in the git, commit them, and tag that commit.
create_files(
tmp_git.path,
"subdir_c/6.0.0.json",
"definitions/subdir_a/1.0.0.json",
"definitions/subdir_a/2.0.0.json",
"definitions/subdir_b/3.0.0.json",
"definitions/subdir_b/4.0.0.json",
)
tmp_git.command("add", "-A")
tmp_git.command("commit", "-m", "Initial set of files")
tmp_git.command("tag", "v1.0.0")

# Add an additional file and delete one of the original files.
(tmp_git.path / "definitions/subdir_b/5.0.0.json").touch()
tmp_git.command("rm", "definitions/subdir_a/2.0.0.json")
tmp_git.command("add", "-A")
tmp_git.command("commit", "-m", "Make changes")

# Make sure the results we get are consistent with the original
# contents of the git.
assert versions.latest_in_gitref("v1.0.0", tmp_git.path, "definitions") == {
"subdir_a": semver.VersionInfo.parse("2.0.0"),
"subdir_b": semver.VersionInfo.parse("4.0.0"),
}


def test_latest_in_dir(tmp_path):
create_files(
tmp_path,
"subdir_c/6.0.0.json",
"definitions/subdir_a/1.0.0.json",
"definitions/subdir_a/2.0.0.json",
"definitions/subdir_b/3.0.0.json",
"definitions/subdir_b/4.0.0.json",
)

assert versions.latest_in_dir(tmp_path / "definitions") == {
"subdir_a": semver.VersionInfo.parse("2.0.0"),
"subdir_b": semver.VersionInfo.parse("4.0.0"),
}
68 changes: 68 additions & 0 deletions versions.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,68 @@
# Copyright 2024 Axis Communications AB.
# For a full list of individual contributors, please see the commit history.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""The versions module contains functions for discovering definition files."""

import os
import subprocess
from pathlib import Path
from typing import Dict
from typing import Iterable

import semver


def latest_in_gitref(
committish: str, gitdir: Path, subdir: Path
) -> Dict[str, semver.version.Version]:
"""Lists the definition files found under a given subdirectory of a
git at a given point in time (described by a committish, e.g. a
SHA-1, tag, or branch reference) and returns a dict that maps each
typename (e.g. EiffelArtifactCreatedEvent) to the latest version found.
"""
return _latest_versions(
Path(line)
for line in (
subprocess.check_output(
["git", "ls-tree", "-r", "--name-only", committish, "--", subdir],
cwd=gitdir,
)
.decode("utf-8")
.splitlines()
)
)


def latest_in_dir(path: Path) -> Dict[str, semver.version.Version]:
"""Inspects the definition files found under a given path and returns
a dict that maps each typename (e.g. EiffelArtifactCreatedEvent) to
its latest version found.
"""
return _latest_versions(
Path(current) / f for current, _, files in os.walk(path) for f in files
)


def _latest_versions(paths: Iterable[Path]) -> Dict[str, semver.version.Version]:
"""Given a list of foo/<typename>/<version>.<ext> pathnames, returns
a dict mapping typenames to the most recent version of that type.
"""
result = {}
for path in paths:
type = path.parent.name
this_version = semver.VersionInfo.parse(Path(path.name).stem)
if type not in result or result[type] < this_version:
result[type] = this_version
return result

0 comments on commit 2c28aa3

Please sign in to comment.