PyHealth/pyhealth/interpret/methods/basic_gradient.py at dec963c1c26fcd98b0f66659dfe36f6a00faf2aa · sunlabuiuc/PyHealth · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
import torch
import numpy as np
from typing import Dict
from pyhealth.interpret.methods.base_interpreter import BaseInterpreter

class BasicGradientSaliencyMaps(BaseInterpreter):
    """Compute gradient-based saliency maps for image classification models.

    This class generates saliency maps by computing gradients of model predictions with respect
    to input pixels, highlighting regions that most influenced the prediction. The saliency is
    computed by taking the maximum absolute gradient across color channels.

    The method is particularly useful for:

    - **Clinical interpretability**: Understanding which image regions drove a diagnosis
    - **Model debugging**: Verifying the model focuses on clinically relevant features
    - **Trust and transparency**: Providing visual explanations for predictions
    - **Error analysis**: Comparing saliency maps for correct vs. incorrect predictions

    Algorithm:
        1. Forward pass: Compute model predictions for input batch
        2. Target selection: Use predicted class (argmax of probabilities)
        3. Backward pass: Compute gradients with respect to input pixels
        4. Saliency map: Take absolute value and max across color channels

    Mathematical formula:
        saliency(x, y) = max_c |∂score_predicted / ∂pixel_{x,y,c}|
        where c iterates over color channels (RGB or grayscale)

    Examples:
        Basic usage with a batch::

            from pyhealth.interpret.methods.basic_gradient import BasicGradientSaliencyMaps
            import matplotlib.pyplot as plt

            # Create batch
            batch = {
                'image': torch.randn(2, 3, 224, 224),
                'disease': torch.tensor([0, 1])
            }

            # Compute saliency maps
            saliency = BasicGradientSaliencyMaps(model, input_batch=batch)

            # Visualize
            saliency.visualize_saliency_map(
                plt,
                image_index=0,
                title="Saliency Map",
                id2label={0: "Normal", 1: "COVID"}
            )

        Using the attribute() interface::

            # Initialize without batch
            saliency = BasicGradientSaliencyMaps(model)

            # Compute attributions for new data
            attributions = saliency.attribute(**batch)
            # Returns: {'image': tensor with saliency maps}

            # Save to batch history
            attributions = saliency.attribute(save_to_batch=True, **batch)

    Note:
        - Do not use within ``torch.no_grad()`` context as gradients are required
        - Works with any PyHealth image classification model
        - For best results, normalize input images consistently with training

    See Also:
        - ``examples/ChestXrayClassificationWithSaliency.ipynb``: Complete tutorial
        - :class:`~pyhealth.interpret.methods.IntegratedGradients`: Alternative attribution method
    """
    def __init__(self, model, input_batch=None, image_key='image', label_key='disease'):
        """Initialize the saliency map generator.

        Args:
            model: PyHealth model with forward method expecting image and disease kwargs
            input_batch: Optional batch of data as dictionary, list, or tensor.
                        If None, use attribute() method to compute saliency maps.
            image_key: Key for accessing images in samples (default: 'image')
            label_key: Key for accessing labels in samples (default: 'disease')
        """
        # Validate that input_batch is either a dictionary, list, tensor, or None
        if input_batch is not None and not isinstance(input_batch, (dict, list, torch.Tensor)):
            raise ValueError("input_batch must be a dictionary, list, tensor, or None")

        # Call parent constructor
        super().__init__(model)

        # Store additional attributes specific to this class
        self.Model = model  # Keep for backward compatibility
        self.Input_batch = input_batch
        self.Image_key = image_key
        self.Label_key = label_key
        self.Batch_saliency_maps = []

        # Compute saliency maps if input_batch was provided
        if input_batch is not None:
            self._compute_saliency_maps()

    def attribute(self, save_to_batch=False, **data) -> Dict[str, torch.Tensor]:
        """Compute attribution scores for input features.

        This method implements the BaseInterpreter interface by computing
        gradient-based saliency maps for the input images.

        Args:
            save_to_batch: If True, save results to Batch_saliency_maps (default: False)
            **data: Input data dictionary containing 'image' and optionally 'disease' keys

        Returns:
            Dict[str, torch.Tensor]: Dictionary with 'saliency' key mapping to saliency map tensor
        """
        # Process the batch
        if isinstance(data, (list, torch.Tensor)):
            batch_dict = {
                self.Image_key: data[0] if isinstance(data, list) else data,
                self.Label_key: data[1] if isinstance(data, list) else None
            }
        else:
            batch_dict = data

        # Prepare input tensors
        imgs = batch_dict[self.Image_key]
        batch_images = imgs.clone().detach().requires_grad_()
        batch_labels = batch_dict.get(self.Label_key, None)

        # Get model predictions
        output = self.model(image=batch_images, disease=batch_labels)
        y_prob = output['y_prob']
        target_class = y_prob.argmax(dim=1)
        scores = y_prob.gather(1, target_class.unsqueeze(1)).squeeze()

        # Compute gradients
        self.model.zero_grad()
        scores.sum().backward()

        # Process gradients into saliency map
        sal = batch_images.grad.abs()
        sal, _ = torch.max(sal, dim=1)  # Max across channels

        # Save to Batch_saliency_maps if requested
        if save_to_batch:
            result = {
                'saliency': sal,
                'image': batch_images,
                'label': batch_labels
            }
            self.Batch_saliency_maps.append(result)

        return {self.Image_key: sal}

    def get_gradient_saliency_maps(self):
        """Retrieve gradient saliency maps.

        Returns:
            list: Batch saliency map results
        """
        return self.Batch_saliency_maps

    def _compute_saliency_maps(self):
        """Compute gradient saliency maps for input batch."""
        if self.Input_batch is None:
            return  # Nothing to compute

        self.Model.eval()

        if isinstance(self.Input_batch, (list, torch.Tensor)):
            # If input_batch is a list or tensor, wrap it in a dictionary
            batch_dict = {
                self.Image_key: self.Input_batch[0] if isinstance(self.Input_batch, list) else self.Input_batch,
                self.Label_key: self.Input_batch[1] if isinstance(self.Input_batch, list) else None
            }
            self._process_batch(batch_dict)
        else:
            # Assume it's already a dictionary
            self._process_batch(self.Input_batch)

    def _process_batch(self, batch):
        """Process a batch of inputs to generate saliency maps.

        This method wraps the attribute() method to maintain backward compatibility
        with the original batch processing API.

        Args:
            batch: Dictionary containing image and label tensors with keys
                  matching self.Image_key and self.Label_key
        """
        # Use attribute method to compute saliency
        attributions = self.attribute(**batch)

        # Extract the saliency map from attributions
        sal = attributions[self.Image_key]

        # Prepare input tensors for storing complete results
        imgs = batch[self.Image_key]
        batch_images = imgs.clone().detach().requires_grad_()
        batch_labels = batch[self.Label_key]

        # Store results in the original format for backward compatibility
        result = {
            'saliency': sal,
            'image': batch_images,
            'label': batch_labels
        }

        self.Batch_saliency_maps.append(result)

    def visualize_saliency_map(self, plt, *, image_index, title=None, id2label=None, alpha=0.3):
        """Display an image with its saliency map overlay.

        This method uses the SaliencyVisualizer for rendering and adds model
        prediction information to the visualization.

        Args:
            plt: matplotlib.pyplot instance
            image_index: Index of image within batch
            title: Optional title for the plot
            id2label: Optional dictionary mapping class indices to labels
            alpha: Transparency of saliency overlay (default: 0.3)
        """
        from pyhealth.interpret.methods.saliency_visualization import SaliencyVisualizer

        if plt is None:
            import matplotlib.pyplot as plt

        # Check if input_batch is available
        if self.Input_batch is None:
            raise ValueError("Cannot visualize: no input_batch was provided during initialization")

        # Get image from input batch
        img_tensor = self.Input_batch[self.Image_key][image_index]
        true_label = self.Input_batch[self.Label_key][image_index].item()

        # Ensure input is a tensor with correct shape
        if img_tensor.dim() == 3:
            img_tensor = img_tensor.unsqueeze(0)
        if img_tensor.dim() != 4:
            raise ValueError(f"Expected 4D tensor (batch, channels, height, width), got shape {img_tensor.shape}")

        # Compute saliency
        img_tensor = img_tensor.clone().requires_grad_(True)

        # Create a dummy label tensor of zeros for the forward pass
        dummy_label = torch.zeros(img_tensor.size(0), dtype=torch.long, device=img_tensor.device)

        output = self.Model(image=img_tensor, disease=dummy_label)
        pred_class = torch.argmax(output['y_prob']).item()

        # Backward pass
        self.Model.zero_grad()
        output['y_prob'][:, pred_class].backward()

        # Get saliency map
        saliency = torch.max(img_tensor.grad.abs(), dim=1)[0]

        # Add both true label and predicted class to title
        if id2label is not None:
            true_label_str = id2label[true_label]
            pred_label_str = id2label[pred_class]
            if title is None:
                title = f"True: {true_label_str}, Predicted: {pred_label_str}"
            else:
                title = f"{title} - True: {true_label_str}, Predicted: {pred_label_str}"

        # Use SaliencyVisualizer for rendering
        visualizer = SaliencyVisualizer(default_alpha=alpha)
        visualizer.plot_saliency_overlay(
            plt,
            image=img_tensor[0],
            saliency=saliency,
            title=title,
            alpha=alpha
        )