Fixes

vivekmig · vivekmig · commit 6b71d66d9329 · 2021-02-19T13:44:05.000-08:00
diff --git a/captum/attr/_core/kernel_shap.py b/captum/attr/_core/kernel_shap.py
@@ -1,6 +1,5 @@
 #!/usr/bin/env python3
 
-import math
 from typing import Any, Callable, Generator, Tuple, Union
 
 import torch
@@ -17,57 +16,6 @@
 from captum.log import log_usage
 
 
-def combination(n: int, k: int) -> int:
-    try:
-        # Combination only available in Python 3.8
-        return math.comb(n, k)  # type: ignore
-    except AttributeError:
-        return math.factorial(n) // math.factorial(k) // math.factorial(n - k)
-
-
-def kernel_shap_similarity_kernel(
-    _, __, interpretable_sample: Tensor, **kwargs
-) -> Tensor:
-    assert (
-        "num_interp_features" in kwargs
-    ), "Must provide num_interp_features to use default similarity kernel"
-    num_selected_features = int(interpretable_sample.sum(dim=1).item())
-    num_features = kwargs["num_interp_features"]
-    if num_selected_features == 0 or num_selected_features == num_features:
-        # weight should be theoretically infinite when denom = 0
-        # enforcing that trained linear model must satisfy
-        # end-point criteria. In practice, it is sufficient to
-        # make this weight substantially larger so setting this
-        # weight to 1000000 (all other weights are 1).
-        similarities = 1000000.0
-    else:
-        similarities = 1.0
-    return torch.tensor([similarities])
-
-
-def kernel_shap_perturb_generator(
-    original_inp, **kwargs
-) -> Generator[Tensor, None, None]:
-    assert "num_select_distribution" in kwargs and "num_interp_features" in kwargs, (
-        "num_select_distribution and num_interp_features are necessary"
-        " to use kernel_shap_perturb_func"
-    )
-    if isinstance(original_inp, Tensor):
-        device = original_inp.device
-    else:
-        device = original_inp[0].device
-    num_features = kwargs["num_interp_features"]
-    yield torch.ones(1, num_features, device=device, dtype=torch.long)
-    yield torch.zeros(1, num_features, device=device, dtype=torch.long)
-    while True:
-        num_selected_features = kwargs["num_select_distribution"].sample()
-        rand_vals = torch.randn(1, num_features)
-        threshold = torch.kthvalue(
-            rand_vals, num_features - num_selected_features
-        ).values.item()
-        yield (rand_vals > threshold).to(device=device).long()
-
-
 class KernelShap(Lime):
     r"""
     Kernel SHAP is a method that uses the LIME framework to compute
@@ -92,9 +40,10 @@ def __init__(self, forward_func: Callable) -> None:
             self,
             forward_func,
             interpretable_model=SkLearnLinearRegression(),
-            similarity_func=kernel_shap_similarity_kernel,
-            perturb_func=kernel_shap_perturb_generator,
+            similarity_func=self.kernel_shap_similarity_kernel,
+            perturb_func=self.kernel_shap_perturb_generator,
         )
+        self.inf_weight = 1000000.0
 
     @log_usage()
     @lime_n_perturb_samples_deprecation_decorator
@@ -337,3 +286,46 @@ def attribute(  # type: ignore
             return_input_shape=return_input_shape,
             num_select_distribution=Categorical(probs),
         )
+
+    def kernel_shap_similarity_kernel(
+        self, _, __, interpretable_sample: Tensor, **kwargs
+    ) -> Tensor:
+        assert (
+            "num_interp_features" in kwargs
+        ), "Must provide num_interp_features to use default similarity kernel"
+        num_selected_features = int(interpretable_sample.sum(dim=1).item())
+        num_features = kwargs["num_interp_features"]
+        if num_selected_features == 0 or num_selected_features == num_features:
+            # The weight should theoretically be infinite when denom = 0
+            # (no features or all features selected), enforcing that the
+            # trained linear model satisfies the end-point criteria. In
+            # practice a substantially larger weight is sufficient, so
+            # self.inf_weight is used (all other weights are 1).
+            similarities = self.inf_weight
+        else:
+            similarities = 1.0
+        return torch.tensor([similarities])
+
+    def kernel_shap_perturb_generator(
+        self, original_inp: Union[Tensor, Tuple[Tensor, ...]], **kwargs
+    ) -> Generator[Tensor, None, None]:
+        assert (
+            "num_select_distribution" in kwargs and "num_interp_features" in kwargs
+        ), (
+            "num_select_distribution and num_interp_features are necessary"
+            " to use kernel_shap_perturb_func"
+        )
+        if isinstance(original_inp, Tensor):
+            device = original_inp.device
+        else:
+            device = original_inp[0].device
+        num_features = kwargs["num_interp_features"]
+        yield torch.ones(1, num_features, device=device, dtype=torch.long)
+        yield torch.zeros(1, num_features, device=device, dtype=torch.long)
+        while True:
+            num_selected_features = kwargs["num_select_distribution"].sample()
+            rand_vals = torch.randn(1, num_features)
+            threshold = torch.kthvalue(
+                rand_vals, num_features - num_selected_features
+            ).values.item()
+            yield (rand_vals > threshold).to(device=device).long()
diff --git a/captum/attr/_core/lime.py b/captum/attr/_core/lime.py
@@ -73,7 +73,7 @@ def __init__(
         forward_func: Callable,
         interpretable_model: Model,
         similarity_func: Callable,
-        perturb_func: Union[Callable],
+        perturb_func: Callable,
         perturb_interpretable_space: bool,
         from_interp_rep_transform: Optional[Callable],
         to_interp_rep_transform: Optional[Callable],