RotNet-FA-Baseline/rotnet3D_regression.py at main · MASILab/RotNet-FA-Baseline · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
"""
Copyright (c) 2025. All rights reserved.
RotNet-FA-Image: Rotation Prediction for FA Maps
Author: Yehyun  Suh
Description: This script implements a deep learning model using PyTorch for predicting rotation angles of 3D fractional anisotropy maps.
License: This script is provided "as-is" without warranty of any kind. Use at your own risk.
"""

import os
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import Dataset, DataLoader
import nibabel as nib
import numpy as np
from scipy.ndimage import rotate
from tqdm import tqdm
import matplotlib.pyplot as plt

class NiiDataset(Dataset):
    """
    Custom Dataset to load and preprocess NIfTI (.nii.gz) files for training.

    Args:
        data_dir (str): Directory containing .nii.gz files.

    Raises:
        ValueError: If no .nii.gz files are found in the specified directory.
    """
    def __init__(self, data_dir):
        super().__init__()
        self.data_dir = data_dir
        self.files = [
            os.path.join(root, f)
            for root, _, filenames in os.walk(data_dir)
            for f in filenames if f.endswith('.nii.gz')
        ]
        if not self.files:
            raise ValueError(f"No .nii.gz files found in {data_dir}.")

        # Generate x-axis rotation angles for each sample
        self.samples = [(file_path, np.random.uniform(0, 360)) for file_path in self.files]

    def __len__(self):
        return len(self.samples)

    def __getitem__(self, idx):
        file_path, angle = self.samples[idx]

        try:
            img = nib.load(file_path).get_fdata()
            img = self.preprocess_fa_map(img)
            if img is None:
                return torch.full((1, 64, 64, 64), float('nan')), torch.tensor([angle])

            img_rotated = self.rotate_image(img, angle)
            return torch.tensor(img_rotated, dtype=torch.float32).unsqueeze(0), torch.tensor([angle], dtype=torch.float32)

        except Exception as e:
            print(f"Error processing {file_path}: {e}")
            return torch.full((1, 64, 64, 64), float('nan')), torch.tensor([angle])

    @staticmethod
    def preprocess_fa_map(img):
        """
        Preprocess an FA map by normalizing intensities and resizing to 64x64x64.

        Args:
            img (numpy.ndarray): Input 3D image.

        Returns:
            numpy.ndarray: Preprocessed 3D image or None if invalid.
        """
        img = np.nan_to_num(img, nan=0.0, posinf=1.0, neginf=0.0)
        if np.all(img == 0) or np.max(img) - np.min(img) < 1e-6:
            return None

        img = torch.tensor(img, dtype=torch.float32).unsqueeze(0).unsqueeze(0)
        img = torch.nn.functional.interpolate(img, size=(64, 64, 64), mode='trilinear', align_corners=False)
        img = img.squeeze().numpy()

        p1, p99 = np.percentile(img[img > 0], [1, 99])
        img = np.clip(img, p1, p99)
        return (img - p1) / (p99 - p1)

    @staticmethod
    def rotate_image(img, angle):
        """
        Rotate a 3D image along the x-axis.

        Args:
            img (numpy.ndarray): Input 3D image.
            angle (float): Rotation angle in degrees.

        Returns:
            numpy.ndarray: Rotated 3D image.
        """
        return rotate(img, angle=angle, axes=(1, 2), reshape=False)


class RotationRegressionModel(nn.Module):
    """
    3D Convolutional Neural Network for regression of rotation angles.
    """
    def __init__(self):
        super(RotationRegressionModel, self).__init__()
        self.conv_layers = nn.Sequential(
            nn.Conv3d(1, 32, kernel_size=3, padding=1),
            nn.BatchNorm3d(32),
            nn.ReLU(),
            nn.MaxPool3d(2),

            nn.Conv3d(32, 64, kernel_size=3, padding=1),
            nn.BatchNorm3d(64),
            nn.ReLU(),
            nn.MaxPool3d(2),

            nn.Conv3d(64, 128, kernel_size=3, padding=1),
            nn.BatchNorm3d(128),
            nn.ReLU(),
            nn.MaxPool3d(2),

            nn.Conv3d(128, 256, kernel_size=3, padding=1),
            nn.BatchNorm3d(256),
            nn.ReLU(),
            nn.MaxPool3d(2),

            nn.Conv3d(256, 512, kernel_size=3, padding=1),
            nn.BatchNorm3d(512),
            nn.ReLU(),
            nn.MaxPool3d(2)
        )

        self.fc_size = self._calculate_fc_size()

        self.fc1 = nn.Linear(self.fc_size, 512)
        self.fc2 = nn.Linear(512, 256)
        self.fc3 = nn.Linear(256, 128)
        self.fc4 = nn.Linear(128, 1)

    def _calculate_fc_size(self):
        """
        Calculate the size of the flattened feature vector from convolutional layers.

        Returns:
            int: Flattened feature vector size.
        """
        dummy_input = torch.zeros(1, 1, 64, 64, 64)
        output = self.conv_layers(dummy_input)
        return output.numel()

    def forward(self, x):
        """
        Forward pass of the model.

        Args:
            x (torch.Tensor): Input tensor of shape (batch_size, 1, 64, 64, 64).

        Returns:
            torch.Tensor: Predicted rotation angles of shape (batch_size, 1).
        """
        x = self.conv_layers(x)
        x = x.view(-1, self.fc_size)
        x = nn.functional.relu(self.fc1(x))
        x = nn.functional.relu(self.fc2(x))
        x = nn.functional.relu(self.fc3(x))
        return self.fc4(x)


def visualize_sample(model, dataset, device, epoch, sample_idx=0):
    """
    Visualize the prediction of a single sample from the dataset.

    Args:
        model (torch.nn.Module): The trained PyTorch model for rotation angle prediction.
        dataset (Dataset): The dataset containing the input images and true angles.
        device (torch.device): The device (CPU or GPU) on which the model is running.
        epoch (int): The current epoch number, used for saving visualizations.
        sample_idx (int, optional): The index of the sample to visualize. Defaults to 0.

    Returns:
        None. Saves a visualization of the original and rotated image with predicted and true rotation angles.
    """
    # Set the model to evaluation mode and disable gradient computation
    model.eval()
    with torch.no_grad():
        # Retrieve the input image and true angle for the specified sample
        input_image, true_angle = dataset[sample_idx]

        # Check if the input image contains invalid values
        if torch.isnan(input_image).any():
            print(f"Skipping visualization for sample {sample_idx} - invalid data")
            return

        # Prepare the input tensor for the model by adding a batch dimension and moving to the device
        input_tensor = input_image.unsqueeze(0).to(device)

        # Predict the rotation angle using the model
        predicted_angle = model(input_tensor)

        # Extract the middle slices from the 3D image for visualization
        mid_slice_xy = input_image[0, input_image.shape[1] // 2, :, :]
        mid_slice_yz = input_image[0, :, input_image.shape[2] // 2, :]
        mid_slice_xz = input_image[0, :, :, input_image.shape[3] // 2]

        # Create a figure for displaying the original and rotated images
        fig, axes = plt.subplots(2, 3, figsize=(15, 10))

        # Plot the original image slices
        axes[0, 0].imshow(mid_slice_xy, cmap='gray')
        axes[0, 0].set_title('Original - XY Plane')
        axes[0, 1].imshow(mid_slice_yz, cmap='gray')
        axes[0, 1].set_title('Original - YZ Plane')
        axes[0, 2].imshow(mid_slice_xz, cmap='gray')
        axes[0, 2].set_title('Original - XZ Plane')

        # Apply the true rotation to the original image for comparison
        rotated_image = dataset.rotate_image(input_image[0].numpy(), true_angle.item())

        # Extract the middle slices from the rotated image
        mid_rotated_xy = rotated_image[rotated_image.shape[0] // 2, :, :]
        mid_rotated_yz = rotated_image[:, rotated_image.shape[1] // 2, :]
        mid_rotated_xz = rotated_image[:, :, rotated_image.shape[2] // 2]

        # Plot the rotated image slices
        axes[1, 0].imshow(mid_rotated_xy, cmap='gray')
        axes[1, 0].set_title('Rotated - XY Plane')
        axes[1, 1].imshow(mid_rotated_yz, cmap='gray')
        axes[1, 1].set_title('Rotated - YZ Plane')
        axes[1, 2].imshow(mid_rotated_xz, cmap='gray')
        axes[1, 2].set_title('Rotated - XZ Plane')

        # Add a title summarizing the true and predicted angles
        plt.suptitle(f'Epoch {epoch + 1}\n'
                     f'True X-axis rotation: {true_angle.item():.1f}°\n'
                     f'Predicted X-axis rotation: {predicted_angle.item():.1f}°')

        # Adjust the layout and save the figure
        plt.tight_layout()
        os.makedirs(f'result_regression/epoch_{epoch + 1}', exist_ok=True)
        plt.savefig(f'result_regression/epoch_{epoch + 1}/sample_prediction_{sample_idx}.png')
        plt.close()


def train_model(data_dir, batch_size=8, epochs=20, lr=1e-3):
    """
    Train the rotation regression model on the given dataset.

    Args:
        data_dir (str): Directory containing NIfTI files.
        batch_size (int): Number of samples per batch.
        epochs (int): Number of training epochs.
        lr (float): Learning rate for optimizer.

    Returns:
        model (RotationRegressionModel): Trained model.
        list: Training loss for each epoch.
    """
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    dataset = NiiDataset(data_dir)
    dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=True, num_workers=4, drop_last=True)

    model = RotationRegressionModel().to(device)
    criterion = nn.MSELoss()
    optimizer = optim.AdamW(model.parameters(), lr=lr, weight_decay=0.01)
    scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, mode='min', factor=0.5, patience=5)

    train_losses = []

    for epoch in range(epochs):
        model.train()
        running_loss = 0.0

        for inputs, angles in tqdm(dataloader, desc=f"Epoch {epoch + 1}/{epochs}"):
            if torch.isnan(inputs).any():
                continue

            inputs, angles = inputs.to(device), angles.to(device)
            optimizer.zero_grad()
            predicted_angles = model(inputs)
            loss = criterion(predicted_angles, angles)
            loss.backward()
            optimizer.step()

            running_loss += loss.item()

        epoch_loss = running_loss / len(dataloader)
        train_losses.append(epoch_loss)
        scheduler.step(epoch_loss)

        print(f"Epoch {epoch + 1}/{epochs}, Loss: {epoch_loss:.4f}")
        if epoch == 0 or (epoch+1) % 5 == 0:
            for sample_idx in range(min(10, len(dataset))):
                visualize_sample(model, dataset, device, epoch, sample_idx)

    return model, train_losses


if __name__ == "__main__":
    DATA_DIR = "data"
    BATCH_SIZE = 18
    EPOCHS = 100
    LR = 1e-3

    model, losses = train_model(DATA_DIR, BATCH_SIZE, EPOCHS, LR)

    # Save final model weights
    weights_fc4 = model.fc4.weight.detach().cpu().numpy().T
    np.save("vectors.npy", weights_fc4)