Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add verify-alpha-spec hook #28

Merged
merged 21 commits into from
May 28, 2024
Merged
Show file tree
Hide file tree
Changes from 20 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 7 additions & 0 deletions .pre-commit-hooks.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,13 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
- id: verify-alpha-spec
name: verify-alpha-spec
description: make sure RAPIDS packages have correct alpha spec
entry: verify-alpha-spec
language: python
files: dependencies[.]yaml$
args: [--fix]
- id: verify-conda-yes
name: pass -y/--yes to conda
description: make sure that all calls to conda pass -y/--yes
Expand Down
3 changes: 3 additions & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -32,8 +32,10 @@ classifiers = [
]
requires-python = ">=3.9"
dependencies = [
"PyYAML",
"bashlex",
"gitpython",
"packaging",
"rich",
"tomlkit",
]
Expand All @@ -45,6 +47,7 @@ test = [
]

[project.scripts]
verify-alpha-spec = "rapids_pre_commit_hooks.alpha_spec:main"
verify-conda-yes = "rapids_pre_commit_hooks.shell.verify_conda_yes:main"
verify-copyright = "rapids_pre_commit_hooks.copyright:main"
verify-pyproject-license = "rapids_pre_commit_hooks.pyproject_license:main"
Expand Down
215 changes: 215 additions & 0 deletions src/rapids_pre_commit_hooks/alpha_spec.py
vyasr marked this conversation as resolved.
Show resolved Hide resolved
Original file line number Diff line number Diff line change
@@ -0,0 +1,215 @@
# Copyright (c) 2024, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import re
from functools import total_ordering

import yaml
from packaging.requirements import Requirement

from .lint import LintMain

RAPIDS_ALPHA_SPEC_PACKAGES = {
KyleFromNVIDIA marked this conversation as resolved.
Show resolved Hide resolved
"cubinlinker",
"cucim",
"cudf",
"cugraph",
"cugraph-dgl",
"cugraph-equivariant",
"cugraph-pyg",
"cuml",
"cuproj",
"cuspatial",
"cuxfilter",
"dask-cudf",
"distributed-ucxx",
"librmm",
"libucx",
"nx-cugraph",
"ptxcompiler",
"pylibcugraph",
"pylibcugraphops",
"pylibraft",
"pylibwholegraph",
"pynvjitlink",
"raft-dask",
"rmm",
"ucx-py",
"ucxx",
}

RAPIDS_CUDA_SUFFIXED_PACKAGES = set(RAPIDS_ALPHA_SPEC_PACKAGES)
KyleFromNVIDIA marked this conversation as resolved.
Show resolved Hide resolved

ALPHA_SPECIFIER = ">=0.0.0a0"

ALPHA_SPEC_OUTPUT_TYPES = {
"pyproject",
"requirements",
}

CUDA_SUFFIX_REGEX = re.compile(r"^(?P<package>.*)-cu[0-9]{2}$")


def node_has_type(node, tag_type):
return node.tag == f"tag:yaml.org,2002:{tag_type}"


def is_rapids_cuda_suffixed_package(name):
return any(
(match := CUDA_SUFFIX_REGEX.search(name)) and match.group("package") == package
for package in RAPIDS_CUDA_SUFFIXED_PACKAGES
)


def check_package_spec(linter, args, node):
@total_ordering
class SpecPriority:
def __init__(self, spec):
self.spec = spec

def __eq__(self, other):
return self.spec == other.spec

def __lt__(self, other):
if self.spec == other.spec:
return False
if self.spec == ALPHA_SPECIFIER:
return False
if other.spec == ALPHA_SPECIFIER:
return True
return self.sort_str() < other.sort_str()

def sort_str(self):
return "".join(c for c in self.spec if c not in "<>=")

def create_specifier_string(specifiers):
return ",".join(sorted(specifiers, key=SpecPriority))

if node_has_type(node, "str"):
req = Requirement(node.value)
if req.name in RAPIDS_ALPHA_SPEC_PACKAGES or is_rapids_cuda_suffixed_package(
req.name
):
has_alpha_spec = any(str(s) == ALPHA_SPECIFIER for s in req.specifier)
if args.mode == "development" and not has_alpha_spec:
linter.add_warning(
(node.start_mark.index, node.end_mark.index),
f"add alpha spec for RAPIDS package {req.name}",
).add_replacement(
(node.start_mark.index, node.end_mark.index),
str(
req.name
+ create_specifier_string(
{str(s) for s in req.specifier} | {ALPHA_SPECIFIER}
)
),
)
elif args.mode == "release" and has_alpha_spec:
linter.add_warning(
(node.start_mark.index, node.end_mark.index),
f"remove alpha spec for RAPIDS package {req.name}",
).add_replacement(
(node.start_mark.index, node.end_mark.index),
str(
req.name
+ create_specifier_string(
{str(s) for s in req.specifier} - {ALPHA_SPECIFIER}
)
),
)


def check_packages(linter, args, node):
if node_has_type(node, "seq"):
for package_spec in node.value:
check_package_spec(linter, args, package_spec)


def check_common(linter, args, node):
if node_has_type(node, "seq"):
for dependency_set in node.value:
if node_has_type(dependency_set, "map"):
for dependency_set_key, dependency_set_value in dependency_set.value:
if (
node_has_type(dependency_set_key, "str")
and dependency_set_key.value == "packages"
):
check_packages(linter, args, dependency_set_value)


def check_matrices(linter, args, node):
if node_has_type(node, "seq"):
for item in node.value:
if node_has_type(item, "map"):
for matrix_key, matrix_value in item.value:
if (
node_has_type(matrix_key, "str")
and matrix_key.value == "packages"
):
check_packages(linter, args, matrix_value)


def check_specific(linter, args, node):
if node_has_type(node, "seq"):
for matrix_matcher in node.value:
if node_has_type(matrix_matcher, "map"):
for matrix_matcher_key, matrix_matcher_value in matrix_matcher.value:
if (
node_has_type(matrix_matcher_key, "str")
and matrix_matcher_key.value == "matrices"
):
check_matrices(linter, args, matrix_matcher_value)


def check_dependencies(linter, args, node):
if node_has_type(node, "map"):
for _, dependencies_value in node.value:
if node_has_type(dependencies_value, "map"):
for dependency_key, dependency_value in dependencies_value.value:
if node_has_type(dependency_key, "str"):
if dependency_key.value == "common":
check_common(linter, args, dependency_value)
elif dependency_key.value == "specific":
check_specific(linter, args, dependency_value)


def check_root(linter, args, node):
if node_has_type(node, "map"):
for root_key, root_value in node.value:
if node_has_type(root_key, "str") and root_key.value == "dependencies":
check_dependencies(linter, args, root_value)


def check_alpha_spec(linter, args):
check_root(linter, args, yaml.compose(linter.content))


def main():
m = LintMain()
m.argparser.description = (
"Verify that RAPIDS packages in dependencies.yaml do (or do not) have "
"the alpha spec."
)
m.argparser.add_argument(
"--mode",
help="mode to use (development has alpha spec, release does not)",
choices=["development", "release"],
default="development",
)
with m.execute() as ctx:
ctx.add_check(check_alpha_spec)


if __name__ == "__main__":
main()
Loading