refactor feature ablation (#1047)

aobo-y · facebook-github-bot · commit 5f878af6a74a · 2022-10-20T13:14:05.000-07:00
Summary: - refactor to feature ablation to make the logic about multi-output attribution more readable - removed some (outdated) misleading comments - add more comments to explain the steps and tensor shapes Pull Request resolved: #1047 Reviewed By: vivekmig Differential Revision: D40388808 Pulled By: aobo-y fbshipit-source-id: fb105a302fe3eeef302a1c50e39847e783bb48e2
diff --git a/captum/attr/_core/feature_ablation.py b/captum/attr/_core/feature_ablation.py
@@ -286,22 +286,20 @@ def attribute(
             if show_progress:
                 attr_progress.update()
 
+            # number of elements in the output of forward_func
+            n_outputs = initial_eval.numel() if isinstance(initial_eval, Tensor) else 1
+
+            # flatten eval outputs into 1D (n_outputs)
+            # add the leading dim for n_feature_perturbed
+            if isinstance(initial_eval, Tensor):
+                initial_eval = initial_eval.reshape(1, -1)
+
             agg_output_mode = FeatureAblation._find_output_mode(
                 perturbations_per_eval, feature_mask
             )
 
-            # get as a 2D tensor (if it is not a scalar)
-            if isinstance(initial_eval, torch.Tensor):
-                initial_eval = initial_eval.reshape(1, -1)
-                num_outputs = initial_eval.shape[1]
-            else:
-                num_outputs = 1
-
             if not agg_output_mode:
-                assert (
-                    isinstance(initial_eval, torch.Tensor)
-                    and num_outputs == num_examples
-                ), (
+                assert isinstance(initial_eval, Tensor) and n_outputs == num_examples, (
                     "expected output of `forward_func` to have "
                     + "`batch_size` elements for perturbations_per_eval > 1 "
                     + "and all feature_mask.shape[0] > 1"
@@ -316,8 +314,9 @@ def attribute(
             )
 
             total_attrib = [
+                # attribute w.r.t each output element
                 torch.zeros(
-                    (num_outputs,) + input.shape[1:],
+                    (n_outputs,) + input.shape[1:],
                     dtype=attrib_type,
                     device=input.device,
                 )
@@ -328,7 +327,7 @@ def attribute(
             if self.use_weights:
                 weights = [
                     torch.zeros(
-                        (num_outputs,) + input.shape[1:], device=input.device
+                        (n_outputs,) + input.shape[1:], device=input.device
                     ).float()
                     for input in inputs
                 ]
@@ -354,8 +353,11 @@ def attribute(
                     perturbations_per_eval,
                     **kwargs,
                 ):
-                    # modified_eval dimensions: 1D tensor with length
-                    # equal to #num_examples * #features in batch
+                    # modified_eval has (n_feature_perturbed * n_outputs) elements
+                    # shape:
+                    #   agg mode: (*initial_eval.shape)
+                    #   non-agg mode:
+                    #     (feature_perturbed * batch_size, *initial_eval.shape[1:])
                     modified_eval = _run_forward(
                         self.forward_func,
                         current_inputs,
@@ -366,25 +368,34 @@ def attribute(
                     if show_progress:
                         attr_progress.update()
 
-                    # (contains 1 more dimension than inputs). This adds extra
-                    # dimensions of 1 to make the tensor broadcastable with the inputs
-                    # tensor.
                     if not isinstance(modified_eval, torch.Tensor):
                         eval_diff = initial_eval - modified_eval
                     else:
                         if not agg_output_mode:
+                            # current_batch_size is not n_examples
+                            # it may get expanded by n_feature_perturbed
+                            current_batch_size = current_inputs[0].shape[0]
                             assert (
-                                modified_eval.numel() == current_inputs[0].shape[0]
+                                modified_eval.numel() == current_batch_size
                             ), """expected output of forward_func to grow with
                             batch_size. If this is not the case for your model
                             please set perturbations_per_eval = 1"""
 
-                        eval_diff = (
-                            initial_eval - modified_eval.reshape((-1, num_outputs))
-                        ).reshape((-1, num_outputs) + (len(inputs[i].shape) - 1) * (1,))
+                        # reshape the leading dim for n_feature_perturbed
+                        # flatten each feature's eval outputs into 1D of (n_outputs)
+                        modified_eval = modified_eval.reshape(-1, n_outputs)
+                        # eval_diff in shape (n_feature_perturbed, n_outputs)
+                        eval_diff = initial_eval - modified_eval
+
+                        # append the shape of one input example
+                        # to make it broadcastable to mask
+                        eval_diff = eval_diff.reshape(
+                            eval_diff.shape + (inputs[i].dim() - 1) * (1,)
+                        )
                         eval_diff = eval_diff.to(total_attrib[i].device)
                     if self.use_weights:
                         weights[i] += current_mask.float().sum(dim=0)
+
                     total_attrib[i] += (eval_diff * current_mask.to(attrib_type)).sum(
                         dim=0
                     )