WiP: Globalization from local explainer #24

Merged: 19 commits, Jun 14, 2024
2 changes: 2 additions & 0 deletions pytest.ini
@@ -5,3 +5,5 @@ markers =
     localization_metrics: localization_metrics
     unnamed_metrics: unnamed_metrics
     randomization_metrics: randomization_metrics
+    aggregators: aggregators
+    self_influence: self_influence
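
Registering the new marks here keeps pytest from emitting unknown-marker warnings and lets the new suites run in isolation, e.g. pytest -m aggregators or pytest -m self_influence.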
43 changes: 43 additions & 0 deletions src/explainers/aggregators/aggregators.py
@@ -0,0 +1,43 @@
from abc import ABC, abstractmethod

import torch


class ExplanationsAggregator(ABC):
    def __init__(self, training_size: int, *args, **kwargs):
        self.scores = torch.zeros(training_size)

    @abstractmethod
    def update(self, explanations: torch.Tensor):
        raise NotImplementedError

    def reset(self, *args, **kwargs):
        """
        Used to reset the aggregator state.
        """
        self.scores = torch.zeros_like(self.scores)

    def load_state_dict(self, state_dict: dict, *args, **kwargs):
        """
        Used to load the aggregator state.
        """
        self.scores = state_dict["scores"]

    def state_dict(self, *args, **kwargs):
        """
        Used to return the aggregator state.
        """
        return {"scores": self.scores}

    def compute(self) -> torch.Tensor:
        return self.scores.argsort()


class SumAggregator(ExplanationsAggregator):
    def update(self, explanations: torch.Tensor) -> None:
        self.scores += explanations.sum(dim=0)


class AbsSumAggregator(ExplanationsAggregator):
    def update(self, explanations: torch.Tensor) -> None:
        self.scores += explanations.abs().sum(dim=0)
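
For orientation, a minimal usage sketch (names and shapes here are illustrative, not part of the PR): local explanations arrive batch-wise as (n_test, training_size) tensors, and compute() returns the training indices sorted by aggregated score, ascending.

    import torch

    from src.explainers.aggregators.aggregators import SumAggregator

    aggregator = SumAggregator(training_size=1000)
    for batch in explanation_batches:  # each batch: (n_test, 1000) local attributions
        aggregator.update(batch)
    global_ranking = aggregator.compute()  # indices from lowest to highest total score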
30 changes: 30 additions & 0 deletions src/explainers/aggregators/self_influence.py
@@ -0,0 +1,30 @@
from typing import Optional

import torch

from utils.explain_wrapper import ExplainFunc


def get_self_influence_ranking(
    model: torch.nn.Module,
    model_id: str,
    cache_dir: str,
    training_data: torch.utils.data.Dataset,
    explain_fn: ExplainFunc,
    explain_fn_kwargs: Optional[dict] = None,
) -> torch.Tensor:
    # Guard against the default None before unpacking as keyword arguments.
    if explain_fn_kwargs is None:
        explain_fn_kwargs = {}
    size = len(training_data)
    self_inf = torch.zeros((size,))

    for i, (x, y) in enumerate(training_data):
        self_inf[i] = explain_fn(
            model=model,
            model_id=f"{model_id}_id_{i}",
            cache_dir=cache_dir,
            test_tensor=x[None],
            test_label=y[None],
            train_dataset=training_data,
            train_ids=[i],
            **explain_fn_kwargs,
        )
    return self_inf.argsort()
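
The globalization trick: each training point is explained with train_ids=[i], i.e. against itself as the only candidate influencer, so the returned attribution is exactly that point's self-influence; the final argsort then ranks the whole training set by that score, ascending.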
6 changes: 1 addition & 5 deletions src/metrics/localization/identical_class.py
@@ -15,11 +15,7 @@ def __init__(
         super().__init__(model, train_dataset, device, *args, **kwargs)
         self.scores = []

-    def update(
-        self,
-        test_labels: torch.Tensor,
-        explanations: torch.Tensor
-    ):
+    def update(self, test_labels: torch.Tensor, explanations: torch.Tensor):
         """
         Used to implement metric-specific logic.
         """
4 changes: 1 addition & 3 deletions src/metrics/randomization/model_randomization.py
@@ -79,9 +79,7 @@ def update(
         corrs = self.correlation_measure(explanations, rand_explanations)
         self.results["rank_correlations"].append(corrs)

-    def compute(
-        self,
-    ):
+    def compute(self):
         return torch.cat(self.results["rank_correlations"]).mean()

     def reset(self):
2 changes: 1 addition & 1 deletion src/metrics/unnamed/top_k_overlap.py
@@ -29,7 +29,7 @@ def compute(self, *args, **kwargs):
         return len(torch.unique(self.all_top_k_examples))

     def reset(self, *args, **kwargs):
-        self.all_top_k_examples = []
+        self.all_top_k_examples = torch.empty(0, self.top_k)

     def load_state_dict(self, state_dict: dict, *args, **kwargs):
         self.all_top_k_examples = state_dict["all_top_k_examples"]
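
The reset state presumably becomes an empty (0, top_k) tensor rather than a list so that update can torch.cat incoming (batch_size, top_k) blocks of retrieved indices and compute can call torch.unique on the accumulated tensor directly.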
2 changes: 2 additions & 0 deletions src/utils/common.py
@@ -3,6 +3,8 @@
 from typing import Any, Callable, Mapping

 import torch
+import torch.utils
+import torch.utils.data


 def _get_module_from_name(model: torch.nn.Module, layer_name: str) -> Any:
16 changes: 11 additions & 5 deletions src/utils/explain_wrapper.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,9 @@
from typing import Optional, Protocol
from typing import List, Optional, Protocol, Union

import torch
from captum.influence import SimilarityInfluence

from src.utils.datasets.indexed_subset import IndexedSubset
from src.utils.functions.similarities import cosine_similarity


Expand All @@ -12,20 +13,23 @@ def __call__(
model: torch.nn.Module,
model_id: str,
cache_dir: Optional[str],
train_dataset: torch.utils.data.Dataset,
test_tensor: torch.Tensor,
method: str,
test_tensor: torch.Tensor,
train_dataset: torch.utils.data.Dataset,
train_ids: Optional[Union[List[int], torch.Tensor]] = None,
) -> torch.Tensor:
...
pass


 def explain(
     model: torch.nn.Module,
     model_id: str,
     cache_dir: str,
+    method: str,
     train_dataset: torch.utils.data.Dataset,
     test_tensor: torch.Tensor,
-    method: str,
+    test_target: Optional[torch.Tensor] = None,
+    train_ids: Optional[Union[List[int], torch.Tensor]] = None,
Review thread (Owner): what is the difference between test_target and test_tensor?
Reply (Collaborator, Author): test_target is which output we are explaining. There is no such notion for similarity of intermediate representations, but in general explainers can be used to explain different outputs. (An illustrative call is sketched after this diff.)
     **kwargs,
 ) -> torch.Tensor:
     """
@@ -41,6 +45,8 @@ def explain(
     :return:
     """
     if method == "SimilarityInfluence":
+        if train_ids is not None:
+            train_dataset = IndexedSubset(dataset=train_dataset, indices=train_ids)
         layer = kwargs.get("layer", "features")
         sim_metric = kwargs.get("similarity_metric", cosine_similarity)
         sim_direction = kwargs.get("similarity_direction", "max")
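
To make the test_target discussion concrete, here is a hypothetical call under the new signature (variable names are made up; for "SimilarityInfluence", test_target is unused, since representation-similarity attributions do not depend on a chosen model output):

    attributions = explain(
        model=model,
        model_id="lenet_mnist",
        cache_dir="./cache",
        method="SimilarityInfluence",
        train_dataset=train_dataset,
        test_tensor=test_batch,  # inputs whose attributions we want
        test_target=None,        # which model output to explain; ignored by similarity methods
        train_ids=None,          # or a list of training indices to restrict attribution to
        layer="features",        # forwarded via **kwargs to the SimilarityInfluence branch
    )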
20 changes: 20 additions & 0 deletions src/utils/functions/similarities.py
@@ -25,3 +25,23 @@ def cosine_similarity(test, train, replace_nan=0) -> Tensor:

     similarity = torch.mm(test, train)
     return similarity
+
+
+def dot_product_similarity(test, train, replace_nan=0) -> Tensor:
+    """
+    Compute dot product similarity between test and train activations.
+
+    :param test:
+    :param train:
+    :param replace_nan:
+    :return:
+    """
+    # TODO: I don't know why Captum returns test activations as a list
+    if isinstance(test, list):
+        test = torch.cat(test)
+    assert torch.all(test == train)
Review comment (Owner): Hi @gumityolcu, please let's be more careful 😄
+    test = test.view(test.shape[0], -1)
+    train = train.view(train.shape[0], -1)
+
+    similarity = torch.mm(test, train.T)
+    return similarity
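
Note that assert torch.all(test == train) can only hold when a batch is compared against itself, which is exactly the self-influence setting exercised by the tests below; as a general similarity function this would need to be relaxed, which is presumably what the reviewer is pointing at above.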
47 changes: 47 additions & 0 deletions tests/explainers/aggregators/test_aggregators.py
@@ -0,0 +1,47 @@
import pytest
import torch

from src.explainers.aggregators.aggregators import (
    AbsSumAggregator,
    SumAggregator,
)


@pytest.mark.aggregators
@pytest.mark.parametrize(
    "test_id, dataset, explanations",
    [
        (
            "mnist",
            "load_mnist_dataset",
            "load_mnist_explanations_1",
        ),
    ],
)
def test_sum_aggregator(test_id, dataset, explanations, request):
    dataset = request.getfixturevalue(dataset)
    explanations = request.getfixturevalue(explanations)
    aggregator = SumAggregator(training_size=len(dataset))
    aggregator.update(explanations)
    global_rank = aggregator.compute()
    assert torch.allclose(global_rank, explanations.sum(dim=0).argsort())


@pytest.mark.aggregators
@pytest.mark.parametrize(
    "test_id, dataset, explanations",
    [
        (
            "mnist",
            "load_mnist_dataset",
            "load_mnist_explanations_1",
        ),
    ],
)
def test_abs_aggregator(test_id, dataset, explanations, request):
    dataset = request.getfixturevalue(dataset)
    explanations = request.getfixturevalue(explanations)
    aggregator = AbsSumAggregator(training_size=len(dataset))
    aggregator.update(explanations)
    global_rank = aggregator.compute()
    # mean and sum differ only by a constant factor, so the argsort order is identical
    assert torch.allclose(global_rank, explanations.abs().mean(dim=0).argsort())
38 changes: 38 additions & 0 deletions tests/explainers/aggregators/test_self_influence.py
@@ -0,0 +1,38 @@
from collections import OrderedDict

import pytest
import torch
from torch.utils.data import TensorDataset

from src.explainers.aggregators.self_influence import (
    get_self_influence_ranking,
)
from src.utils.explain_wrapper import explain
from src.utils.functions.similarities import dot_product_similarity


@pytest.mark.self_influence
@pytest.mark.parametrize(
    "test_id, explain_kwargs",
    [
        (
            "random_data",
            {"method": "SimilarityInfluence", "layer": "identity", "similarity_metric": dot_product_similarity},
        ),
    ],
)
def test_self_influence_ranking(test_id, explain_kwargs, request):
    model = torch.nn.Sequential(OrderedDict([("identity", torch.nn.Identity())]))
    X = torch.randn(100, 200)
    rand_dataset = TensorDataset(X, torch.randint(0, 10, (100,)))

    self_influence_rank = get_self_influence_ranking(
        model=model,
        model_id="0",
        cache_dir="temp_captum",
        training_data=rand_dataset,
        explain_fn=explain,
        explain_fn_kwargs=explain_kwargs,
    )

    # With an identity layer, the dot-product self-influence of x is <x, x> = ||x||^2,
    # so the ranking must match the ordering of the row norms.
    assert torch.allclose(self_influence_rank, torch.linalg.norm(X, dim=-1).argsort())
2 changes: 1 addition & 1 deletion tests/utils/test_explain_wrapper.py
@@ -30,9 +30,9 @@ def test_explain(test_id, model, dataset, explanations, test_tensor, method, met
         model,
         test_id,
         os.path.join("./cache", "test_id"),
+        method,
         dataset,
         test_tensor,
-        method,
         **method_kwargs,
     )
     assert torch.allclose(explanations, explanations_exp), "Training data attributions are not as expected"