python(refactor): rules module (#113)

sift-stack · Nov 4, 2024 · fa4fe4c · fa4fe4c
1 parent 59809b7
commit fa4fe4c
Show file tree

Hide file tree

Showing 4 changed files with 303 additions and 291 deletions.
diff --git a/python/lib/sift_py/ingestion/rule/__init__.py b/python/lib/sift_py/ingestion/rule/__init__.py
@@ -1,3 +1,4 @@
 """
-Concerned with loading in rules to use during ingestion.
+This module is deprecated and exists only to re-export members
+of `sift_py.rule`. Prefer to use that module.
 """
diff --git a/python/lib/sift_py/ingestion/rule/config.py b/python/lib/sift_py/ingestion/rule/config.py
@@ -1,290 +1,11 @@
-from __future__ import annotations
-
-from abc import ABC, abstractmethod
-from enum import Enum
-from typing import Any, Dict, List, Optional, Tuple, TypedDict, Union, cast
-
-from sift.annotations.v1.annotations_pb2 import AnnotationType
-from sift.rules.v1.rules_pb2 import ActionKind
-
-from sift_py._internal.convert.json import AsJson
-from sift_py.ingestion.channel import ChannelConfig
-from sift_py.ingestion.config.yaml.spec import RuleYamlSpec
-
-
-class RuleConfig(AsJson):
-    """
-    Defines a rule to be used during ingestion. If a rule's expression evaluates to true, then
-    a specific action will take place as specified by the `action` attribute.
-
-    - `name`: Name of the rule.
-    - `description`: Description of the rule.
-    - `expression`: A CEL string expression, that, when evaluated to a truthy value, executes the `action`.
-    - `action`: The action to execute if the result of an `expression` evaluates to a truthy value.
-    - `channel_references`: Reference to channel. If an expression is "$1 < 10", then "$1" is the reference and thus should be the key in the dict.
-    - `rule_client_key`: User defined unique string that uniquely identifies this rule.
-    - `asset_names`: A list of asset names that this rule should be applied to. ONLY VALID if defining rules outside of a telemetry config.
-    - `tag_names`: A list of tag names that this rule should be applied to. ONLY VALID if defining rules outside of a telemetry config.
-    - `namespace`: A string key that refers to a namespace where a rule is defined. Namespaces are defined in YAML.
-    - `namespace_rules`: A dictionary of rules loaded from a namespace YAML.
-    """
-
-    name: str
-    description: str
-    expression: str
-    action: Optional[RuleAction]
-    channel_references: List[ExpressionChannelReference]
-    rule_client_key: Optional[str]
-    asset_names: List[str]
-
-    def __init__(
-        self,
-        name: str,
-        channel_references: List[
-            Union[ExpressionChannelReference, ExpressionChannelReferenceChannelConfig]
-        ],
-        description: str = "",
-        expression: str = "",
-        action: Optional[RuleAction] = None,
-        rule_client_key: Optional[str] = None,
-        asset_names: Optional[List[str]] = None,
-        tag_names: Optional[List[str]] = None,
-        sub_expressions: Dict[str, Any] = {},
-        namespace: str = "",
-        namespace_rules: Dict[str, List[RuleYamlSpec]] = {},
-    ):
-        self.channel_references = []
-
-        for channel_reference in channel_references:
-            config = channel_reference.get("channel_config")
-
-            if config is not None:
-                config = cast(ChannelConfig, config)
-
-                self.channel_references.append(
-                    {
-                        "channel_reference": channel_reference["channel_reference"],
-                        "channel_identifier": config.fqn(),
-                    }
-                )
-            else:
-                channel_ref = cast(ExpressionChannelReference, channel_reference)
-
-                self.channel_references.append(
-                    {
-                        "channel_reference": channel_ref["channel_reference"],
-                        "channel_identifier": channel_ref["channel_identifier"],
-                    }
-                )
-
-        self.name = name
-
-        if namespace:
-            description, expression, rule_client_key, action, asset_names, tag_names = (
-                self.__class__.interpolate_namespace_rule(name, namespace, namespace_rules)
-            )
-
-        if asset_names:
-            self.asset_names = asset_names
-
-        self.action = action
-        self.rule_client_key = rule_client_key
-        self.description = description
-        self.expression = self.__class__.interpolate_sub_expressions(expression, sub_expressions)
-
-    def as_json(self) -> Any:
-        """
-        Produces the appropriate JSON structure that's suitable for the Rules API.
-        """
-
-        hash_map: Dict[str, Union[List[ExpressionChannelReference], str, List[str], None]] = {
-            "name": self.name,
-            "description": self.description,
-            "expression": self.expression,
-        }
-
-        hash_map["expression_channel_references"] = self.channel_references
-
-        if isinstance(self.action, RuleActionCreateDataReviewAnnotation):
-            hash_map["type"] = RuleActionAnnotationKind.REVIEW.value
-            hash_map["assignee"] = self.action.assignee
-
-            if self.action.assignee is not None and len(self.action.assignee) > 0:
-                hash_map["assignee"] = self.action.assignee
-
-            if self.action.tags is not None and len(self.action.tags) > 0:
-                hash_map["tags"] = self.action.tags
-
-        elif isinstance(self.action, RuleActionCreatePhaseAnnotation):
-            hash_map["type"] = RuleActionAnnotationKind.PHASE.value
-
-            if self.action.tags is not None and len(self.action.tags) > 0:
-                hash_map["tags"] = self.action.tags
-        else:
-            kind = self.action.kind() if self.action else self.action
-            raise TypeError(f"Unsupported rule action '{kind}'.")
-
-        return hash_map
-
-    @staticmethod
-    def interpolate_sub_expressions(
-        expression: str, sub_expressions: Optional[Dict[str, str]]
-    ) -> str:
-        if sub_expressions:
-            for ref, expr in sub_expressions.items():
-                if ref not in expression:
-                    raise ValueError(f"Couldn't find '{ref}' in expression '{expression}'.")
-                if isinstance(expr, str):
-                    expression = expression.replace(ref, f'"{expr}"')
-                else:
-                    expression = expression.replace(ref, str(expr))
-
-        return expression
-
-    @staticmethod
-    def interpolate_namespace_rule(
-        name: str, namespace: str, namespace_rules: Optional[Dict[str, List[RuleYamlSpec]]]
-    ) -> Tuple[str, str, str, RuleAction, List[str], List[str]]:
-        if not namespace_rules:
-            raise ValueError(
-                f"Namespace rules must be provided with namespace key. Got: {namespace_rules}"
-            )
-
-        rule_list = namespace_rules.get(namespace)
-        if not rule_list:
-            raise ValueError(
-                f"Couldn't find namespace '{namespace}' in namespace_rules: {namespace_rules}"
-            )
-
-        candidate_name = None
-        for rule in rule_list:
-            candidate_name = rule.get("name")
-
-            if not candidate_name:
-                break
-
-            if candidate_name == name:
-                description = rule.get("description", "")
-                expression = rule.get("expression", "")
-                type = rule.get("type", "")
-                tags = rule.get("tags")
-                rule_client_key = rule.get("rule_client_key", "")
-                asset_names = rule.get("asset_names", [])
-                tag_names = rule.get("tag_names", [])
-                action: RuleAction = RuleActionCreatePhaseAnnotation(tags)
-                if RuleActionAnnotationKind.from_str(type) == RuleActionAnnotationKind.REVIEW:
-                    action = RuleActionCreateDataReviewAnnotation(
-                        assignee=rule.get("assignee"), tags=tags
-                    )
-                return (
-                    description,
-                    cast(str, expression),
-                    rule_client_key,
-                    action,
-                    asset_names,
-                    tag_names,
-                )
-
-        raise ValueError(
-            f"Could not find rule '{candidate_name}'. Does this rule exist in the namespace? {rule_list}"
-        )
-
-
-class RuleAction(ABC):
-    @abstractmethod
-    def kind(self) -> RuleActionKind:
-        pass
-
-
-class RuleActionCreateDataReviewAnnotation(RuleAction):
-    """
-    Action to create a data-review annotation when a rule evaluates to a truthy value.
-
-    - `tags`: List of tag names to associate with the newly created data-review annotation.
-    - `assignee`: Email of user in organization to assign the newly created data-review annotation.
-    """
-
-    tags: Optional[List[str]]
-    assignee: Optional[str]
-
-    def __init__(self, assignee: Optional[str] = None, tags: Optional[List[str]] = None):
-        self.assignee = assignee
-        self.tags = tags
-
-    def kind(self) -> RuleActionKind:
-        return RuleActionKind.ANNOTATION
-
-
-class RuleActionCreatePhaseAnnotation(RuleAction):
-    """
-    Action to create a phase annotation when a rule evaluates to a truthy value.
-
-    - `tags`: List of tag names to associate with the newly created phase annotation.
-    """
-
-    tags: Optional[List[str]]
-
-    def __init__(self, tags: Optional[List[str]] = None):
-        self.tags = tags
-
-    def kind(self) -> RuleActionKind:
-        return RuleActionKind.ANNOTATION
-
-
-class RuleActionAnnotationKind(Enum):
-    REVIEW = "review"
-    PHASE = "phase"
-
-    @classmethod
-    def from_annotation_type(cls, annotation_type: AnnotationType) -> "RuleActionAnnotationKind":
-        if annotation_type == AnnotationType.ANNOTATION_TYPE_PHASE:
-            return cls.PHASE
-        return cls.PHASE
-
-    @classmethod
-    def from_str(cls, val: str) -> "RuleActionAnnotationKind":
-        if val == cls.REVIEW.value:
-            return cls.REVIEW
-        elif val == cls.PHASE.value:
-            return cls.PHASE
-        else:
-            raise ValueError("Argument 'val' is not a valid annotation kind.")
-
-
-class RuleActionKind(Enum):
-    NOTIFICATION = ActionKind.NOTIFICATION
-    ANNOTATION = ActionKind.ANNOTATION
-
-    @classmethod
-    def from_str(cls, val: str) -> Optional["RuleActionKind"]:
-        if val == "ACTION_KIND_NOTIFICATION" or val == RuleActionKindStrRep.NOTIFICATION.value:
-            return cls.NOTIFICATION
-        elif val == "ACTION_KIND_ANNOTATION" or val == RuleActionKindStrRep.ANNOTATION.value:
-            return cls.ANNOTATION
-
-        return None
-
-
-class RuleActionKindStrRep(Enum):
-    NOTIFICATION = "notification"
-    ANNOTATION = "annotation"
-
-
-class ExpressionChannelReference(TypedDict):
-    """
-    `channel_reference`: The channel reference (e.g. '$1') used in the expression.
-    `channel_identifier`: The fully qualified channel name. See `sift_py.ingestion.channel.channel_fqn`.
-    """
-
-    channel_reference: str
-    channel_identifier: str
-
-
-class ExpressionChannelReferenceChannelConfig(TypedDict):
-    """
-    `channel_reference`: The channel reference (e.g. '$1') used in the expression.
-    `channel_config`: Instance of `sift_py.ingestion.channel.ChannelConfig`.
-    """
-
-    channel_reference: str
-    channel_config: ChannelConfig
+import sift_py.rule.config as rule_config
+
+RuleConfig = rule_config.RuleConfig
+RuleAction = rule_config.RuleAction
+RuleActionCreateDataReviewAnnotation = rule_config.RuleActionCreateDataReviewAnnotation
+RuleActionCreatePhaseAnnotation = rule_config.RuleActionCreatePhaseAnnotation
+RuleActionAnnotationKind = rule_config.RuleActionAnnotationKind
+RuleActionKind = rule_config.RuleActionKind
+RuleActionKindStrRep = rule_config.RuleActionKindStrRep
+ExpressionChannelReference = rule_config.ExpressionChannelReference
+ExpressionChannelReferenceChannelConfig = rule_config.ExpressionChannelReferenceChannelConfig
diff --git a/...lib/sift_py/ingestion/rule/config_test.py → python/lib/sift_py/rule/_config_test.py b/...lib/sift_py/ingestion/rule/config_test.py → python/lib/sift_py/rule/_config_test.py