cypose/train_classification_model.py at master · cameronlab/cypose · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
# train_classification_model.py --- Train classifier
#
# Filename: train_classification_model.py
# Author: Zach Maas and Clair Huffine
# Created: Tue Dec 19 15:36:15 2023 (-0700)
#
#

# Commentary:
#
# This file contains code to train a basic convolutional classifier on
# segmented movies.
#

# Code:

import torch
import torch.nn as nn
import cv2
import tifffile
from nd2reader import ND2Reader
import numpy as np
import glob as glob
from skimage import io
from tqdm import tqdm
import os
from functools import lru_cache
from torch.utils.tensorboard import SummaryWriter

class ND2DataSet(torch.utils.data.Dataset):
    """
    Faster implementation of the nd2 dataset loader.
    Key improvements:
        - Preload all masks per-file to reduce filesystem thrashing
        - Save processed mask objects to memory to speed up subsequent loads
    If needed we will also implement an async buffer class over top for when there are too many files to fit in memory.
    Future improvements:
        - Write each frame to its own file on disk for our buffer class when dealing with larger than menmory datasets
    """

    def __init__(self, root_dir, cache_path=None, calc_cache=False):
        self.root_dir = root_dir
        self.file_list = glob.glob(f"{root_dir}/*.tiff")
        self.tile_size = 32
        # Make sure we have filesA
        if len(self.file_list) == 0:
            raise ValueError(f"No files found in root directory {root_dir}")
        self.masks = [f.replace(".tiff", "_mask.tif") for f in self.file_list]
        cellnumidx = 0  # Initialize prior to count for total cell index
        if cache_path is None:
            self.cache_path = f"{root_dir}/cache"
            if not os.path.exists(self.cache_path):
                os.mkdir(self.cache_path)
        # Check if we have cached data
        if not calc_cache:
            cached_files = glob.glob(f"{self.cache_path}/*.pth")
            self.length = len(cached_files)
            return
        # Manually start a tqdm progress bar
        pbar = tqdm(desc="Caching cells", unit="cell", total=35000)
        # Iterate over every tif file
        for i, iFile in enumerate(self.file_list):
            print(f"Loading file {i+1} of {len(self.file_list)}, {iFile}")
            filename = iFile
            tif = io.imread(iFile)
            movie, parts = self.getAssocND2(filename)
            for j, iFrame in enumerate(tif):
                _, _, _, centroids = cv2.connectedComponentsWithStats(
                    iFrame, 1, cv2.CV_32S
                )
                movie_frame = self.getMovieFrame(movie, j)
                for centroid in centroids:
                    # Process the mask
                    x, y = centroid[0], centroid[1]
                    cropped_mask, cropped_movie = self.padMask(
                        x, y, iFrame, movie_frame, self.tile_size
                    )
                    # If our mask is empty, skip it
                    if cropped_mask.sum() < 10:
                        #print(f"Skipping empty mask at {x},{y}")
                        continue
                    cell_class = self.oneHotEncode(parts)
                    stacked_movie = self.stackMovieAndMask(cropped_mask, cropped_movie)
                    # Add the sample to the cache
                    sample = {
                        "image": torch.tensor(stacked_movie, dtype=torch.float32),
                        "class": torch.tensor(cell_class, dtype=torch.float32),
                    }
                    cellnumidx += 1
                    # Save the sample to disk
                    torch.save(sample, f"{self.cache_path}/{cellnumidx}_data.pth")
                    # Save a thumbnail too lol
                    # self.generateThumbnails(stacked_movie, cellnumidx)
                    # Update the progress bar
                    pbar.update(1)
        # Calculate the length of the dataset
        cached_files = glob.glob(f"{self.cache_path}/*.pth")
        self.length = len(cached_files)

    def __len__(self):
        return self.length

    @lru_cache(maxsize=1)
    def getAssocND2(self, filename):
        """
        Given a tif filename, load the associated nd2 file
        """
        parts = os.path.basename(filename).split("_")
        date_part = parts[0]
        movie_path = glob.glob(f"{self.root_dir}/{date_part}*.nd2")[0]
        if len(movie_path) == 0:
            raise ValueError(f"No associated ND2 file found for {self.root_dir}/{date_part}*.nd2")
        movie = ND2Reader(movie_path)
        return movie, parts

    @staticmethod
    def getMovieFrame(movie, frame: int):
        """
        Given a movie and a frame, load the frame from the movie
        """
        movie.bundle_axes = ['y', 'x', 'c']
        movie_frame = movie.get_frame(frame)
        frame_array = np.zeros((movie_frame.shape[0], movie_frame.shape[1], 6), dtype=np.float32)
        frame_array[:,:,0:5] = movie_frame
        return frame_array

    @staticmethod
    def padMask(x, y, mask_frame, movie_frame, tile_size):
        """Pad the mask to the correct size"""
        # Make sure our size is even
        size = tile_size
        if size % 2 != 0:
            raise ValueError("Data size must be even for automated padding")
        # Calculate sizes
        half_size = size // 2
        movie_x, movie_y = movie_frame.shape[1], movie_frame.shape[0]
        mask_x, mask_y = mask_frame.shape[1], mask_frame.shape[0]
        # Make sure the mask is the same size as the movie
        if movie_x != mask_x or movie_y != mask_y:
            raise ValueError("Mask and movie must be the same size")
        x_min, x_max = 0, mask_x
        y_min, y_max = 0, mask_y
        x1 = int(max(x - half_size, x_min))
        x2 = int(min(x + half_size, x_max))
        y1 = int(max(y - half_size, y_min))
        y2 = int(min(y + half_size, y_max))
        # Crop the images
        cropped_mask = mask_frame[y1:y2, x1:x2]
        cropped_movie = movie_frame[y1:y2, x1:x2]
        # If the cropped images are too small, augment
        mask_shape = cropped_mask.shape
        if mask_shape[0] < size or mask_shape[1] < size:
            # Pad the images
            cropped_mask = np.pad(
                cropped_mask,
                ((0, size - mask_shape[0]), (0, size - mask_shape[1])),
                "constant",
                constant_values=0,
            )
            cropped_movie = np.pad(
                cropped_movie,
                ((0, size - mask_shape[0]), (0, size - mask_shape[1]), (0, 0)),
                "constant",
                constant_values=0,
            )
        return cropped_mask, cropped_movie

    @staticmethod
    def oneHotEncode(parts):
        # We will need to maintain the classification ID based on what mask its taking the cell from
        cell_class = parts[1]
        class_dict = {  # One-hot encoding
            "WT": [1, 0, 0, 0],
            "cyto": [0, 1, 0, 0],
            "csome": [0, 0, 1, 0],
            "pcsome": [0, 0, 0, 1],
        }
        return class_dict[cell_class]

    @staticmethod
    def oneHotDecode(one_hot):
        # We will need to maintain the classification ID based on what mask its taking the cell from
        class_dict = {  # One-hot encoding
            0: "WT",
            1: "cyto",
            2: "csome",
            3: "pcsome",
        }
        return class_dict[one_hot]

    @staticmethod
    def stackMovieAndMask(cropped_mask, cropped_movie):
        """Stack the movie and mask"""
        cropped_movie[:, :, -1] = cropped_mask
        #if cropped_movie.shape != (self.tile_size,self.tile_size,6):
        #    raise ValueError(f"Movie shape is incorrect. Actual is {cropped_movie.shape}, expected is ({self.tile_size},{self.tile_size},6)")
        return cropped_movie

    # Iterate through dataloader and generate thumbnails for each movie
    def generateThumbnails(self, stacked_movie, cell_num):
        """
        Take a batch of images and generate a tiled 3x2 thumbnail of the 6 channels for each image
        """
        # Make an empty image 🥺
        tiled_image = np.zeros((self.tile_size * 3, self.tile_size * 2))
        # Iterate over each channel
        for channel_num in range(6):
            # Get the image
            channel_image = stacked_movie[:, :, channel_num]
            # Calculate the x and y coordinates
            x = channel_num % 2
            y = channel_num // 2
            # Calculate the x and y coordinates
            x1 = x * self.tile_size
            x2 = x1 + self.tile_size
            y1 = y * self.tile_size
            y2 = y1 + self.tile_size
            # Insert the image into the tiled image
            tiled_image[y1:y2, x1:x2] = channel_image
        # Save the tiled image
        tiled_image = tiled_image.astype(np.uint16)
        io.imsave(f"{self.root_dir}/thumbnails/thumb_c{cell_num}.tif", tiled_image)

    def __getitem__(self, idx):
        if torch.is_tensor(idx):
            idx = idx.tolist()
        # Ooops, off by one
        idx += 1
        # Check if we have already loaded this item
        try:
            data = torch.load(f"{self.cache_path}/{idx}_data.pth")
            return data
        except KeyError:
            raise ValueError("Index not found in cache, someone done goofed.")


class ConvNetClassifier(nn.Module):
    def __init__(self, num_channels, num_classes):
        super(ConvNetClassifier, self).__init__()
        assert 1 <= num_channels <= 6, "num_channels must be between 1 and 6"

        self.conv_layers = nn.Sequential(
            nn.Conv2d(num_channels, 16, kernel_size=3, stride=1, padding=1),
            nn.BatchNorm2d(16),
            nn.LeakyReLU(0.2),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(16, 32, kernel_size=3, stride=1, padding=1),
            nn.BatchNorm2d(32),
            nn.LeakyReLU(0.2),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1),
            nn.BatchNorm2d(64),
            nn.LeakyReLU(0.2),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding=1),
            nn.BatchNorm2d(128),
            nn.LeakyReLU(0.2),
            nn.MaxPool2d(kernel_size=2, stride=2)
        )

        self.fc_layers = nn.Sequential(
            nn.Linear(16 * 8 * 4, 256), #change first value to 64 for tile size 64
            nn.LeakyReLU(0.2),
            nn.Linear(256, num_classes),
            # nn.Softmax(dim=1)
        )

    def forward(self, x):
        # Throw away [:,:,:,5] channel
        x = x[:, :, :, 0:5]
        # Train as normal
        x = x.permute(0, 3, 1, 2)
        x = self.conv_layers(x)
        #x = x.view(x.size(0), -1)
        x = torch.flatten(x, 1)
        x = self.fc_layers(x)
        return x

    def predict(self, x):
        with torch.no_grad():
            return torch.argmax(self.forward(x)[0]).item()

# Can we learn anything from our data at all?
# Use an autoencoder to find out
class ConvolutionalAutoencoder(nn.Module):
    def __init__(self):
        super(ConvolutionalAutoencoder, self).__init__()
        self.encoder = nn.Sequential(
            nn.Conv2d(6, 16, kernel_size=3, stride=1, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(16, 32, kernel_size=3, stride=1, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2)
        )
        self.decoder = nn.Sequential(
            nn.ConvTranspose2d(32, 16, kernel_size=2, stride=2),
            nn.ReLU(),
            nn.ConvTranspose2d(16, 6, kernel_size=2, stride=2),
            nn.ReLU()
        )

    def forward(self, x):
        x = x.permute(0, 3, 1, 2)
        x = self.encoder(x)
        x = self.decoder(x)
        x = x.permute(0, 2, 3, 1)
        return x

if __name__ == "__main__":
    # Load the data
    data = ND2DataSet(
        #root_dir="/Volumes/Extreme SSD/ZachML/CellType"
        root_dir="F:/Cypose/7002/7002Class"
    )  # Manually change to initialize the dataset

    # Print the length of the dataset
    # print(len(data))

    # Define the batch size
    batch_size = 32
    # Split the data into train and test sets
    train_dataset, test_dataset = torch.utils.data.random_split(
        data, [0.999, 0.001]
    )
    train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
    test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=True)

    # Set up the training loop
    # First construct a model to optimize
    model = ConvNetClassifier(num_channels=5, num_classes=4)
    # model = ConvolutionalAutoencoder()
    # First we need to define our optimizer and loss function
    optimizer = torch.optim.Adam(model.parameters(), lr=1e-4)
    # Second we need a loss function. This is classification, so we'll use cross entropy loss
    criterion = nn.CrossEntropyLoss()
    # criterion = nn.MSELoss()

    # Next, we figure out the device that we are training on
    if torch.cuda.is_available():
        print("CUDA is available (GPU)")
        device = torch.device("cuda")
    elif torch.backends.mps.is_available():
        print("MPS is available (M1 Mac)")
        device = torch.device("mps")
    else:
        print("GPU is not available (CPU) :(")
        device = torch.device("cpu")

    # Move the model to the device
    model.to(device)

    # Set up tensorboard
    writer = SummaryWriter()

    # Define an accuracy function
    def model_accuracy(outputs, labels):
        """
        Calcluate per-class accuracy.
        """
        return torch.eq(torch.argmax(outputs, dim=1), torch.argmax(labels, dim=1)).sum() / len(labels)


    # Now we can train the model
    num_epochs = 30
    for epoch in range(num_epochs):
        print(f"Epoch {epoch+1}")
        model.train()
        for i, batch in tqdm(
            enumerate(train_loader), desc="Training", unit="batch", total=len(train_loader)
        ):
            # Get the inputs and labels
            inputs = batch["image"].to(device)
            labels = batch["class"].to(device)

            # Zero the parameter gradients
            optimizer.zero_grad()

            # Forward pass
            outputs = model(inputs)
            # Calculate the loss
            train_loss = criterion(outputs, labels)
            # if i % 50 == 0:
            #     prediction = torch.argmax(outputs, dim=1)
            #     label = torch.argmax(labels, dim=1)
            #     print(prediction)
            #     print(label)
            #     print((prediction == label).sum() / prediction.shape[0])

            # loss = criterion(outputs, inputs)
            # Calculate the accuracy
            train_accuracy = model_accuracy(outputs, labels)

            # Backward pass
            train_loss.backward()  # Calculate the gradients
            optimizer.step()  # Update the weights

            # Print statistics
            # if i % 100 == 0:
            #print(f"Batch {i+1}: loss = {loss.item():.3f}")
            writer.add_scalar("Loss/train", train_loss.item(), epoch * len(train_loader) + i)
            writer.add_scalar("Accuracy/train", train_accuracy.item(), epoch * len(train_loader) + i)

        # Evaluate the model
        # losses = torch.tensor((len(test_loader))).to(device)
        # accuracies = torch.tensor((len(test_loader))).to(device)
        model.eval()
        losses = []
        accuracies = []
        for i, batch in tqdm(
            enumerate(test_loader), desc="Testing", unit="batch", total=len(test_loader)
        ):
            # Get the inputs and labels
            inputs = batch["image"].to(device)
            labels = batch["class"].to(device)

            with torch.no_grad():
                outputs = model(inputs)
                test_loss = criterion(outputs, labels)
                test_accuracy = model_accuracy(outputs, labels)

            # losses[i] = test_loss
            # accuracies[i] = test_accuracy.item()
            losses.append(test_loss)
            accuracies.append(test_accuracy.item())

        # test_loss = losses.mean()
        # test_accuracy = accuracies.mean()
        test_loss = torch.tensor(losses).mean()
        test_accuracy = torch.tensor(accuracies).mean()

        writer.add_scalar("Loss/test", test_loss.item(), epoch * len(train_loader))
        writer.add_scalar("Accuracy/test", test_accuracy.item(), epoch * len(train_loader))

        # Save the model
        print("Saving model...")
        torch.save(model.state_dict(), f"models/7002_test4_classifier_model_{epoch+1}.pth")

# train_classification_model.py ends here