
Filter gradients of IndexedSlices in tf grad sim backend, fixes #828 #829

Merged — 35 commits, Jan 11, 2023

Commits
f15d7a8
Filter gradients of IndexedSlices in tf grad sim backend, fixes #828
mauicv Nov 30, 2022
1fd9c38
Add functionality to convert sparse gradients to nd.array
mauicv Jan 5, 2023
3dbc6c6
Add warnings if non-trainable layers present in model
mauicv Jan 5, 2023
ab16515
Fix linting and typing errors
mauicv Jan 5, 2023
87d4ca7
Add check for non-trainable layers in gradsim
mauicv Jan 6, 2023
6cad12c
Add better docstrings
mauicv Jan 6, 2023
12937d8
Add better docstrings for tests
mauicv Jan 6, 2023
219a6a0
Fix minor linting error
mauicv Jan 6, 2023
764bc56
Add check for tensor attribute
mauicv Jan 6, 2023
4a89f48
Check for and log list of non trainable layers on GradSim __init__
mauicv Jan 6, 2023
e77f67f
Add error for non-trainable models in GradSim method
mauicv Jan 9, 2023
efde102
Rewrite get_non_trainable method docstrings
mauicv Jan 9, 2023
22dc19a
Remove typos from doctstrings
mauicv Jan 9, 2023
557af3b
Minor warning rephrase and update tests
mauicv Jan 9, 2023
b9c8f61
Fix minor flake8 error
mauicv Jan 9, 2023
6015d50
Improve error message for numpy conversion error
mauicv Jan 9, 2023
a3270be
Update tensorflow _grad_to_numpy type hints
mauicv Jan 9, 2023
188e1d3
Revert minor changes
mauicv Jan 9, 2023
2af3367
Minor spelling fix to test docstring
mauicv Jan 9, 2023
a6e437c
Update test comment to make behavour clearer
mauicv Jan 9, 2023
ab23c05
Fix typeo in test docstring
mauicv Jan 9, 2023
e95aaf1
Add comment to test to explain build method call
mauicv Jan 9, 2023
6704c64
Add note on batch norm layer in GradSim integration tests
mauicv Jan 9, 2023
876ea61
Fix minor linting errors
mauicv Jan 9, 2023
bf7fad3
Add backticks to modules names in docstrings
mauicv Jan 9, 2023
0e0c919
Make get_not_trainable private
mauicv Jan 9, 2023
09a1674
Add questions to the FAQ docs page detailing performance soln and war…
mauicv Jan 9, 2023
f443185
Minor fixes
mauicv Jan 10, 2023
8a99be5
Fix linting error
mauicv Jan 10, 2023
f69227b
Add minor changes
mauicv Jan 10, 2023
42cf904
Fix Requested PR changes
mauicv Jan 10, 2023
57d04b4
Update non-trainable params warning
mauicv Jan 10, 2023
f72d197
Minor fix
mauicv Jan 10, 2023
308b51f
Remove backticks
mauicv Jan 10, 2023
4bd1f20
Remove commented out lines from test
mauicv Jan 10, 2023
46 changes: 41 additions & 5 deletions alibi/explainers/similarity/backends/pytorch/base.py
@@ -50,8 +50,27 @@ def get_grads(
loss = loss_fn(output, Y)
loss.backward()
model.train(initial_model_state)
return np.concatenate([_PytorchBackend.to_numpy(param.grad).reshape(-1) # type: ignore [arg-type] # see #810
for param in model.parameters()])

return np.concatenate([_PytorchBackend._grad_to_numpy(grad=param.grad, name=name)
for name, param in model.named_parameters()
if param.grad is not None])
Comment from the Contributor Author (mauicv):

Note that torch tensors have a `grad` attribute that defaults to `None`, so we don't have to check that it exists first!
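
# A tiny illustration of that point (not part of the diff): `.grad` is `None`
# until `backward()` runs, which is why filtering on `param.grad is not None`
# is sufficient and no `hasattr` check is needed.
import torch

p = torch.nn.Parameter(torch.ones(3))
print(p.grad)                 # None -- the attribute exists but holds no gradient yet
(p * 2).sum().backward()
print(p.grad)                 # tensor([2., 2., 2.])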


@staticmethod
def _grad_to_numpy(grad: torch.Tensor, name: Optional[str] = None) -> np.ndarray:
"""Convert gradient to `np.ndarray`.

Converts gradient tensor to flat `numpy` array. If the gradient is a sparse tensor, it is converted to a dense
tensor first.
"""
if grad.is_sparse:
grad = grad.to_dense()

if not hasattr(grad, 'numpy'):
name = f' for the named tensor: {name}' if name else ''
raise TypeError((f'Could not convert gradient to `numpy` array{name}. To ignore these '
'gradients in the similarity computation set ``requires_grad=False`` on the '
'corresponding parameter.'))
return grad.reshape(-1).cpu().numpy()

@staticmethod
def to_tensor(X: np.ndarray) -> torch.Tensor:
@@ -72,15 +91,32 @@ def set_device(device: Union[str, int, torch.device, None] = None) -> None:
elif isinstance(device, torch.device):
_PytorchBackend.device = device
elif device is not None:
raise TypeError(("`device` must be a None, string, integer or "
f"torch.device object. Got {type(device)} instead."))
raise TypeError(("`device` must be a ``None``, `string`, `integer` or "
f"`torch.device` object. Got {type(device)} instead."))

@staticmethod
def to_numpy(X: torch.Tensor) -> np.ndarray:
"""Maps a `pytorch` tensor to a `numpy` array."""
"""Maps a `pytorch` tensor to `np.ndarray`."""
return X.detach().cpu().numpy()

@staticmethod
def argmax(X: torch.Tensor, dim=-1) -> torch.Tensor:
"""Returns the index of the maximum value in a tensor."""
return torch.argmax(X, dim=dim)

@staticmethod
def _count_non_trainable(model: nn.Module) -> int:
"""Returns number of non trainable parameters.

Returns the number of parameters that are non trainable. If no trainable parameter exists we raise
a `ValueError`.
"""

num_non_trainable_params = len([param for param in model.parameters() if not param.requires_grad])

if num_non_trainable_params == len(list(model.parameters())):
raise ValueError("The model has no trainable parameters. This method requires at least "
"one trainable parameter to compute the gradients for. "
"Try setting ``.requires_grad_(True)`` on the model or one of its parameters.")

return num_non_trainable_params
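
For reference, a minimal sketch (not part of the diff, assuming a recent `torch` release) of the sparse-gradient case `_grad_to_numpy` handles: an `Embedding` layer built with `sparse=True` produces a sparse `.grad`, which is densified before flattening to `numpy`:

import torch

emb = torch.nn.Embedding(10, 4, sparse=True)       # sparse=True makes the weight gradient a sparse tensor
loss = emb(torch.tensor([[1, 2, 3]])).sum()
loss.backward()

grad = emb.weight.grad
assert grad.is_sparse                               # same check `_grad_to_numpy` performs
flat = grad.to_dense().reshape(-1).cpu().numpy()    # densify, flatten, convert to numpy
print(flat.shape)                                   # (40,) == 10 * 4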
44 changes: 39 additions & 5 deletions alibi/explainers/similarity/backends/tensorflow/base.py
@@ -8,7 +8,7 @@

import numpy as np
import tensorflow as tf
import tensorflow.keras as keras
from tensorflow import keras


class _TensorFlowBackend:
@@ -50,9 +50,29 @@ def get_grads(

# compute gradients of the loss w.r.t the weights
grad_X_train = tape.gradient(loss, model.trainable_weights)
grad_X_train = np.concatenate([w.numpy().reshape(-1) for w in grad_X_train])
grad_X_train = np.concatenate([_TensorFlowBackend._grad_to_numpy(w, getattr(w, 'name', None))
for w in grad_X_train])
return grad_X_train

@staticmethod
def _grad_to_numpy(grad: Union[tf.IndexedSlices, tf.Tensor], name: Optional[str] = None) -> np.ndarray:
"""Convert gradient to `np.ndarray`.

Converts gradient tensor to flat `numpy` array. If the gradient is a sparse tensor, it is converted to a dense
tensor first.
"""

if isinstance(grad, tf.IndexedSlices):
# see https://github.com/SeldonIO/alibi/issues/828
grad = tf.convert_to_tensor(grad)

if not hasattr(grad, 'numpy'):
name = f' for the named tensor: {name}' if name else ''
raise TypeError((f'Could not convert gradient to `numpy` array{name}. To ignore these '
'gradients in the similarity computation set ``trainable=False`` on the '
'corresponding parameter.'))
return grad.numpy().reshape(-1)

@staticmethod
def to_tensor(X: np.ndarray) -> tf.Tensor:
"""Converts a `numpy` array to a `tensorflow` tensor."""
@@ -67,15 +87,29 @@ def set_device(device: Union[str, None] = None) -> None:
if device is None or isinstance(device, str):
_TensorFlowBackend.device = device
else:
raise TypeError(f"`device` must be a string or None. Got {type(device)} instead.")
raise TypeError(f"`device` must be a `string` or ``None``. Got {type(device)} instead.")

@staticmethod
def to_numpy(X: tf.Tensor) -> tf.Tensor:
"""Converts a tensor to a `numpy` array."""
def to_numpy(X: tf.Tensor) -> np.ndarray:
"""Converts a tensor to `np.ndarray`."""
return X.numpy()

@staticmethod
def argmax(X: tf.Tensor, dim=-1) -> tf.Tensor:
"""Returns the index of the maximum value in a tensor."""
X = tf.math.argmax(X, axis=dim)
return X

@staticmethod
def _count_non_trainable(model: keras.Model) -> int:
"""Returns number of non trainable parameters.

Returns the number of parameters that are non trainable. If no trainable parameter exists we raise
a `ValueError`.
"""

if len(model.trainable_weights) == 0:
raise ValueError("The model has no trainable weights. This method requires at least "
"one trainable parameter to compute the gradients for. "
"Set ``trainable=True`` on the model or a model weight.")
return len(model.non_trainable_weights)
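
For reference, a minimal sketch (not part of the diff, assuming `tensorflow` 2.x) of the `tf.IndexedSlices` case from #828 that `_grad_to_numpy` now handles: gradients taken with respect to an `Embedding` weight come back as `IndexedSlices` and are densified before flattening:

import tensorflow as tf

model = tf.keras.Sequential([
    tf.keras.layers.Embedding(10, 4, input_shape=(5,)),
    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(1),
])
X = tf.constant([[1, 2, 3, 4, 5]])

with tf.GradientTape() as tape:
    loss = tf.reduce_sum(model(X))
grads = tape.gradient(loss, model.trainable_weights)

print(type(grads[0]))                          # tf.IndexedSlices for the embedding weight
dense = tf.convert_to_tensor(grads[0])         # densify, as done in `_grad_to_numpy`
print(dense.numpy().reshape(-1).shape)         # (40,) == 10 * 4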
19 changes: 15 additions & 4 deletions alibi/explainers/similarity/grad.py
@@ -7,6 +7,7 @@
from typing import TYPE_CHECKING, Callable, Optional, Union, Dict, Tuple
from typing_extensions import Literal
from enum import Enum
import warnings

import numpy as np

@@ -44,12 +45,12 @@ def __init__(self,
device: 'Union[int, str, torch.device, None]' = None,
verbose: bool = False,
):
"""GradientSimilarity explainer.
"""`GradientSimilarity` explainer.

The gradient similarity explainer is used to find examples in the training data that the predictor considers
similar to test instances the user wants to explain. It uses the gradients of the loss between the model output
and the training data labels. These are compared using the similarity function specified by ``sim_fn``. The
GradientSimilarity can be applied to models trained for both classification and regression tasks.
`GradientSimilarity` explainer can be applied to models trained for both classification and regression tasks.


Parameters
@@ -128,13 +129,23 @@ def __init__(self,
task_name=task
)

num_non_trainable = self.backend._count_non_trainable(self.predictor)
if num_non_trainable:
warning_msg = (f"Found {num_non_trainable} non-trainable parameters in the model. These parameters "
"don't have gradients and will not be included in the computation of gradient similarity."
" This might be because your model has layers that track statistics using non-trainable "
"parameters such as batch normalization layers. In this case, you don't need to worry. "
"Otherwise it's because you have set some parameters to be non-trainable and alibi is "
"letting you know.")
warnings.warn(warning_msg)

def fit(self,
X_train: np.ndarray,
Y_train: np.ndarray) -> "Explainer":
"""Fit the explainer.

The GradientSimilarity explainer requires the model gradients over the training data. In the explain method it
compares them to the model gradients for the test instance(s). If ``store_grads`` was set to ``True`` on
The `GradientSimilarity` explainer requires the model gradients over the training data. In the explain method
it compares them to the model gradients for the test instance(s). If ``precompute_grads=True`` on
initialization then the gradients are precomputed here and stored. This will speed up the explain method call
but storing the gradients may not be feasible for large models.
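
As an aside, a minimal sketch (hypothetical model, assuming an `alibi` version that includes this PR) of the new warning emitted on `__init__` when the model carries frozen parameters:

import tensorflow as tf
from alibi.explainers import GradientSimilarity

model = tf.keras.Sequential([
    tf.keras.layers.Dense(8, activation='relu', input_shape=(4,)),
    tf.keras.layers.Dense(2),
])
model.layers[0].trainable = False        # freeze the first layer: kernel + bias become non-trainable

loss_fn = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)
explainer = GradientSimilarity(model, loss_fn, task='classification')
# UserWarning: Found 2 non-trainable parameters in the model. ...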

7 changes: 4 additions & 3 deletions alibi/explainers/tests/test_simiarlity/conftest.py
@@ -148,9 +148,10 @@ def tf_linear_model(input_shape, output_shape):
Constructs a linear model for `tensorflow`.
"""
return keras.Sequential([
keras.layers.InputLayer(input_shape=input_shape),
keras.layers.Dense(output_shape),
keras.layers.Softmax()
tf.keras.layers.InputLayer(input_shape=input_shape),
tf.keras.layers.Flatten(),
tf.keras.layers.Dense(output_shape),
tf.keras.layers.Softmax()
])


92 changes: 92 additions & 0 deletions alibi/explainers/tests/test_simiarlity/test_backends.py
@@ -2,6 +2,7 @@

import torch
import numpy as np
import tensorflow as tf

from alibi.explainers.similarity.backends.tensorflow.base import _TensorFlowBackend
from alibi.explainers.similarity.backends.pytorch.base import _PytorchBackend
@@ -41,3 +42,94 @@ def test_backends(random_cls_dataset, linear_models):
torch_grads = np.sort(torch_grads)
tf_grads = np.sort(tf_grads)
np.testing.assert_allclose(torch_grads, tf_grads, rtol=1e-04)


@pytest.mark.parametrize('trainable_emd, grads_shape', [(True, (61, )), (False, (21, ))])
def test_tf_embedding_similarity(trainable_emd, grads_shape):
"""Test `GradientSimilarity` explainer correctly handles sparsity and non-trainable layers for `tensorflow`.

Test that `tensorflow` embedding layers work as expected and also that layers
marked as non-trainable are not included in the gradients.
See https://github.com/SeldonIO/alibi/issues/828.
"""
model = tf.keras.models.Sequential([
tf.keras.layers.Embedding(10, 4, input_shape=(5,), trainable=trainable_emd),
tf.keras.layers.Flatten(),
tf.keras.layers.Dense(1)
])

X = tf.random.uniform(shape=(1, 5), minval=0, maxval=10, dtype=tf.float32)
Y = tf.random.uniform(shape=(1, 1), minval=0, maxval=10, dtype=tf.float32)
loss_fn = tf.keras.losses.MeanSquaredError()
tf_grads = _TensorFlowBackend.get_grads(model, X, Y, loss_fn)
assert tf_grads.shape == grads_shape # (4 * 10) * trainable_emd + (5 * 4) + 1


@pytest.mark.parametrize('trainable_emd, grads_shape', [(True, (61, )), (False, (21, ))])
@pytest.mark.parametrize('sparse', [True, False])
def test_pytorch_embedding_similarity(trainable_emd, grads_shape, sparse):
"""Test GradientSimilarity explainer correctly handles sparsity and non-trainable layers for pytorch.

Tests that the `pytorch` embedding layers work as expected and that layers marked as
non-trainable are not included in the gradients.
"""

model = torch.nn.Sequential(
torch.nn.Embedding(10, 4, 5, sparse=sparse),
torch.nn.Flatten(),
torch.nn.LazyLinear(1)
)

model[0].weight.requires_grad = trainable_emd

X = torch.randint(0, 10, (1, 5))
Y = torch.randint(0, 10, (1, 1), dtype=torch.float32)
loss_fn = torch.nn.MSELoss()
pt_grads = _PytorchBackend.get_grads(model, X, Y, loss_fn)
assert pt_grads.shape == grads_shape # (4 * 10) * trainable_emd + (5 * 4) + 1


def test_non_numpy_grads_pytorch():
"""Test that the `pytorch` backend handles gradients withtout `numpy` methods correctly.

`_PytorchBackend` should throw an error if the gradients cannot be converted to numpy arrays.
"""
class MockTensor():
is_sparse = False

with pytest.raises(TypeError) as err:
_PytorchBackend._grad_to_numpy(MockTensor())

assert ("Could not convert gradient to `numpy` array. To ignore these gradients in the "
"similarity computation set ``requires_grad=False`` on the corresponding parameter.") \
in str(err.value)

with pytest.raises(TypeError) as err:
_PytorchBackend._grad_to_numpy(MockTensor(), 'test')

assert ("Could not convert gradient to `numpy` array for the named tensor: test. "
"To ignore these gradients in the similarity computation set ``requires_grad=False``"
" on the corresponding parameter.") in str(err.value)


def test_non_numpy_grads_tensorflow():
"""Test that the `tensorflow` backend handles gradients without `numpy` methods correctly.

`_TensorFlowBackend` should throw an error if the gradients cannot be converted to `numpy` arrays.
"""
class MockTensor():
is_sparse = False

with pytest.raises(TypeError) as err:
_TensorFlowBackend._grad_to_numpy(MockTensor())

assert ("Could not convert gradient to `numpy` array. To ignore these gradients "
"in the similarity computation set ``trainable=False`` on the corresponding parameter.") \
in str(err.value)

with pytest.raises(TypeError) as err:
_TensorFlowBackend._grad_to_numpy(MockTensor(), 'test')

assert ("Could not convert gradient to `numpy` array for the named tensor: test."
" To ignore these gradients in the similarity computation set "
"``trainable=False`` on the corresponding parameter.") in str(err.value)