Skip to content

Commit

Permalink
adding resnet related scripts
Browse files Browse the repository at this point in the history
  • Loading branch information
arouxel-laas committed Mar 9, 2024
1 parent 73add40 commit 71cf609
Show file tree
Hide file tree
Showing 2 changed files with 424 additions and 0 deletions.
372 changes: 372 additions & 0 deletions optimization_modules_with_resnet.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,372 @@
import pytorch_lightning as pl
import torch
import torch.nn as nn
from simca.CassiSystem_lightning import CassiSystemOptim
from MST.simulation.train_code.architecture import *
from simca import load_yaml_config
import matplotlib.pyplot as plt
import torchvision
import numpy as np
from simca.functions_acquisition import *
from piqa import SSIM
from torch.utils.tensorboard import SummaryWriter
import io
import torchvision.transforms as transforms
from PIL import Image
import segmentation_models_pytorch as smp
import torch.nn.functional as F

class UnetModel(nn.Module):
    """Thin wrapper around a segmentation_models_pytorch U-Net.

    The network maps an `in_channels`-channel image to `classes` output maps
    with a sigmoid activation, so outputs lie in [0, 1] (suitable for use as
    a soft mask before binarization).
    """

    def __init__(self, encoder_name="resnet18", encoder_weights="", in_channels=1, classes=2, index=0):
        super().__init__()
        # Bookkeeping tag supplied by the caller; not used internally.
        self.i = index
        self.model = smp.Unet(
            encoder_name=encoder_name,
            in_channels=in_channels,
            encoder_weights=encoder_weights,
            classes=classes,
            activation='sigmoid',
        )

    def forward(self, x):
        """Apply the U-Net to `x` and return its sigmoid-activated output."""
        return self.model(x)


class JointReconstructionModule_V2(pl.LightningModule):
    """Jointly optimizes a CASSI coded-aperture pattern and a spectral
    reconstruction network.

    Pipeline (see ``forward``): a first acquisition made with a
    config-generated 2D pattern is fed to a U-Net (``mask_generation``)
    that predicts a scene-adaptive pattern; the pattern is binarized
    (straight-through estimator) and used for a second acquisition, which
    ``reconstruction_model`` turns back into a hyperspectral cube.
    Training minimizes an RMSE reconstruction loss plus a penalty pushing
    the binary pattern toward a 50% fill ratio (see ``_common_step``).
    """

    def __init__(self, model_name, log_dir="tb_logs", reconstruction_checkpoint=None):
        """
        Args:
            model_name: key understood by ``model_generator`` (the branches in
                ``forward`` handle "birnat", names containing "dauhst", and
                "mst_plus_plus"); also selects how inputs are packed.
            log_dir: directory for the TensorBoard ``SummaryWriter``.
            reconstruction_checkpoint: optional path to pretrained weights for
                the reconstruction model.
        """
        super().__init__()

        self.model_name = model_name
        # TODO : use a real reconstruction module
        self.reconstruction_model = model_generator(self.model_name, pretrained_model_path=reconstruction_checkpoint)
        # U-Net mapping one acquisition channel to one soft-mask channel.
        self.mask_generation = UnetModel(classes=1, encoder_weights=None, in_channels=1)

        self.loss_fn = nn.MSELoss()
        # NOTE(review): ssim_loss is instantiated but not used in any loss below.
        self.ssim_loss = SSIM(window_size=11, size_average=True)

        self.writer = SummaryWriter(log_dir)

    def on_validation_start(self, stage=None):
        """Build the optical simulator (CassiSystemOptim) from YAML configs.

        NOTE(review): ``forward`` depends on ``self.cassi_system`` and
        ``self.config_patterns`` created here, so a validation/sanity pass
        must run before any training step — confirm with the Trainer setup.
        """
        print("---VALIDATION START---")
        self.config = "simca/configs/cassi_system_optim_optics_full_triplet_dd_cassi.yml"
        config_system = load_yaml_config(self.config)
        self.config_patterns = load_yaml_config("simca/configs/pattern.yml")
        self.cassi_system = CassiSystemOptim(system_config=config_system)
        self.cassi_system.propagate_coded_aperture_grid()

    def _normalize_data_by_itself(self, data):
        """Normalize each batch element by its own mean and std over dims 1-2.

        NOTE(review): divides by std with no epsilon — a constant image
        (std == 0) would produce NaN/inf; confirm inputs rule this out.
        """
        # Calculate the mean and std for each batch individually
        # Keep dimensions for broadcasting
        mean = torch.mean(data, dim=[1, 2], keepdim=True)
        std = torch.std(data, dim=[1, 2], keepdim=True)

        # Normalize each batch by its mean and std
        normalized_data = (data - mean) / std
        return normalized_data

    def forward(self, x):
        """Run the two-stage acquisition + reconstruction pipeline.

        Args:
            x: tuple ``(hyperspectral_cube, wavelengths)``; the cube arrives
               channels-first (b, C, H, W) and is permuted to (b, H, W, C).

        Returns:
            The cube produced by ``self.reconstruction_model``.

        Side effects: stores ``self.pattern``, ``self.acquired_image1`` and
        ``self.acquired_image2`` for logging in ``training_step`` /
        ``_common_step``.
        """
        print("---FORWARD---")

        hyperspectral_cube, wavelengths = x
        hyperspectral_cube = hyperspectral_cube.permute(0, 2, 3, 1).to(self.device)
        batch_size, H, W, C = hyperspectral_cube.shape

        # --- Stage 1: acquisition with a config-generated pattern ---
        self.pattern = self.cassi_system.generate_2D_pattern(self.config_patterns, nb_of_patterns=batch_size)
        self.pattern = self.pattern.to(self.device)
        filtering_cube = self.cassi_system.generate_filtering_cube().to(self.device)
        self.acquired_image1 = self.cassi_system.image_acquisition(hyperspectral_cube, self.pattern, wavelengths).to(self.device)

        # Pad to the U-Net's expected 128x128 input size.
        self.acquired_image1 = pad_tensor(self.acquired_image1, (128, 128))

        # flip along second and third axis
        self.acquired_image1 = self.acquired_image1.flip(1)
        self.acquired_image1 = self.acquired_image1.flip(2)
        self.acquired_image1 = self.acquired_image1.unsqueeze(1).float()

        # --- Stage 2: U-Net predicts a scene-adaptive pattern ---
        self.pattern = self.mask_generation(self.acquired_image1).squeeze(1)
        # Hard 0/1 threshold with straight-through gradients.
        self.pattern = BinarizeFunction.apply(self.pattern)
        # Pad the pattern to the coded-aperture grid size (131x131).
        self.pattern = pad_tensor(self.pattern, (131, 131))
        self.cassi_system.pattern = self.pattern.to(self.device)

        filtering_cube = self.cassi_system.generate_filtering_cube().to(self.device)
        self.acquired_image2 = self.cassi_system.image_acquisition(hyperspectral_cube, self.pattern, wavelengths).to(self.device)


        # self.acquired_image1 = self._normalize_data_by_itself(self.acquired_image1)
        # acquired_cubes = self.acquired_image1.unsqueeze(1).repeat((1, 28, 1, 1)).float().to(self.device) # b x W x R x C

        # Resample the filtering cube to 28 spectral channels over 450-650 nm
        # (nearest-neighbour selection, no interpolation), channels-first.
        filtering_cubes = subsample(filtering_cube, torch.linspace(450, 650, filtering_cube.shape[-1]), torch.linspace(450, 650, 28)).permute((0, 3, 1, 2)).float().to(self.device)

        # Pack acquisition / mask inputs in the layout each architecture expects.
        if self.model_name == "birnat":
            # acquisition = self.acquired_image1.unsqueeze(1)
            acquisition = self.acquired_image2.float()
            filtering_cubes = filtering_cubes.float()
        elif "dauhst" in self.model_name:
            acquisition = self.acquired_image2.float()
            # Phi_s = sum over channels of Phi^2; zeros replaced by 1,
            # presumably to avoid division by zero inside the model — confirm.
            filtering_cubes_s = torch.sum(filtering_cubes ** 2, 1)
            filtering_cubes_s[filtering_cubes_s == 0] = 1
            filtering_cubes = (filtering_cubes.float(), filtering_cubes_s.float())

        elif self.model_name == "mst_plus_plus":
            # Replicate the single acquisition over 28 channels.
            acquisition = self.acquired_image2.unsqueeze(1).repeat((1, 28, 1, 1)).float().to(self.device)


        reconstructed_cube = self.reconstruction_model(acquisition, filtering_cubes)


        return reconstructed_cube

    def training_step(self, batch, batch_idx):
        """One optimization step; every 30 global steps also logs image grids,
        the spectral-filter plot and mask-generator gradient norms."""
        print("Training step")

        loss, reconstructed_cube, ref_cube = self._common_step(batch, batch_idx)



        output_images = self._convert_output_to_images(self._normalize_image_tensor(self.acquired_image2))
        patterns = self._convert_output_to_images(self._normalize_image_tensor(self.pattern))
        input_images = self._convert_output_to_images(self._normalize_image_tensor(ref_cube[:, :, :, 0]))
        reconstructed_image = self._convert_output_to_images(self._normalize_image_tensor(reconstructed_cube[:, :, :, 0]))

        if self.global_step % 30 == 0:
            self._log_images('train/acquisition2', output_images, self.global_step)
            self._log_images('train/ground_truth', input_images, self.global_step)
            self._log_images('train/reconstructed', reconstructed_image, self.global_step)
            self._log_images('train/patterns', patterns, self.global_step)

            # Debug snapshot of the first pattern, written next to the cwd.
            # NOTE(review): the figure is never closed, so repeated logging
            # accumulates matplotlib figures/colorbars — consider plt.close().
            plt.imshow(self.pattern[0, :, :].cpu().detach().numpy())
            plt.colorbar()
            plt.savefig('./pattern.png')

            spectral_filter_plot = self.plot_spectral_filter(ref_cube, reconstructed_cube)
            self.log_gradients(self.global_step)
            self.writer.add_image('Spectral Filter', spectral_filter_plot, self.global_step)

        self.log_dict(
            {"train_loss": loss,
             },
            on_step=True,
            on_epoch=True,
            prog_bar=True,
        )

        return {"loss": loss}

    def _normalize_image_tensor(self, tensor):
        """Min-max normalize a tensor to [0, 1] (global min/max, not per-item)."""
        # Normalize the tensor to the range [0, 1]
        min_val = tensor.min()
        max_val = tensor.max()
        normalized_tensor = (tensor - min_val) / (max_val - min_val)
        return normalized_tensor

    def validation_step(self, batch, batch_idx):
        """Validation step: shared loss computation, logged as ``val_loss``."""
        print("Validation step")
        loss, reconstructed_cube, ref_cube = self._common_step(batch, batch_idx)

        self.log_dict(
            {"val_loss": loss,
             },
            on_step=True,
            on_epoch=True,
            prog_bar=True,
        )

        return {"loss": loss}

    def test_step(self, batch, batch_idx):
        """Test step: shared loss computation, logged as ``test_loss``."""
        print("Test step")
        loss, reconstructed_cube, ref_cube = self._common_step(batch, batch_idx)
        self.log_dict(
            {"test_loss": loss,
             },
            on_step=True,
            on_epoch=True,
            prog_bar=True,
        )
        return {"loss": loss}

    def predict_step(self, batch, batch_idx):
        """Predict step.

        NOTE(review): returns the loss rather than the reconstructed cube —
        confirm this is intentional for the prediction loop.
        """
        print("Predict step")
        loss, reconstructed_cube, ref_cube = self._common_step(batch, batch_idx)
        self.log('predict_step', loss, on_step=True, on_epoch=True, prog_bar=True, logger=True)
        return loss

    def _common_step(self, batch, batch_idx):
        """Shared train/val/test logic.

        Returns:
            (loss, reconstructed_cube, ref_cube) where
            loss = RMSE(reconstruction, reference)
                 + sum over the batch of the squared relative deviation of
                   each pattern from a 50% fill ratio.
        """
        reconstructed_cube = self.forward(batch)
        hyperspectral_cube, wavelengths = batch

        hyperspectral_cube = hyperspectral_cube.permute(0, 2, 3, 1).to(self.device)
        reconstructed_cube = reconstructed_cube.permute(0, 2, 3, 1).to(self.device)
        # Crop/align the ground truth to the reconstruction's spatial extent.
        ref_cube = match_dataset_to_instrument(hyperspectral_cube, reconstructed_cube[0, :, :, 0])

        # fig, ax = plt.subplots(1, 2)
        # plt.title(f"true cube vs reconstructed cube")
        # ax[0].imshow(hyperspectral_cube[0, :, :, 0].cpu().detach().numpy())
        # ax[1].imshow(reconstructed_cube[0, :, :, 0].cpu().detach().numpy())
        # plt.show()

        # Number of open (==1) pixels per pattern vs the 50% target count.
        total_sum_pattern = torch.sum(self.pattern, dim=(1, 2))
        total_half_pattern_equal_1 = torch.sum(torch.ones_like(self.pattern), dim=(1, 2)) / 2

        print(f"total_sum_pattern {total_sum_pattern}")
        print(f"total_half_pattern_equal_1 {total_half_pattern_equal_1}")



        loss1 = torch.sqrt(self.loss_fn(reconstructed_cube, ref_cube))  # RMSE
        # Squared relative deviation from 50% fill, summed over the batch.
        loss2 = torch.sum(torch.abs((total_sum_pattern - total_half_pattern_equal_1) / (self.pattern.shape[1] * self.pattern.shape[2])) ** 2)
        loss = loss1 + loss2

        print(f"loss1 {loss1}")
        print(f"loss2 {loss2}")
        return loss, reconstructed_cube, ref_cube

    def configure_optimizers(self):
        """Adam (lr=4e-4) with cosine annealing over 500 epochs down to 1e-6."""
        optimizer = torch.optim.Adam(self.parameters(), lr=4e-4)
        return {"optimizer": optimizer,
                "lr_scheduler": {
                    "scheduler": torch.optim.lr_scheduler.CosineAnnealingLR(optimizer, 500, eta_min=1e-6),
                    "interval": "epoch"
                }
                }

    def _log_images(self, tag, images, global_step):
        """Write an image grid to TensorBoard under `tag`."""
        # Convert model output to image grid and log to TensorBoard
        img_grid = torchvision.utils.make_grid(images)
        self.writer.add_image(tag, img_grid, global_step)

    def _convert_output_to_images(self, acquired_images):
        """Turn a (b, H, W) batch into a single grid image tensor."""
        # Add a channel axis so make_grid treats each item as a 1-channel image.
        acquired_images = acquired_images.unsqueeze(1)

        # Create a grid of images for visualization
        img_grid = torchvision.utils.make_grid(acquired_images)
        return img_grid

    def log_gradients(self, step):
        """Log the gradient norm of every mask-generator parameter that has one."""
        for name, param in self.mask_generation.named_parameters():
            if param.grad is not None:
                self.writer.add_scalar(f"Gradients/{name}", param.grad.norm(), step)

    def plot_spectral_filter(self, ref_hyperspectral_cube, recontructed_hyperspectral_cube):
        """Plot reference vs reconstructed spectra at 3 random pixels per batch item.

        Returns:
            The rendered figure as a CHW image tensor suitable for
            ``SummaryWriter.add_image``.
        """
        batch_size, y, x, lmabda_ = ref_hyperspectral_cube.shape

        # Create a figure with subplots arranged horizontally
        fig, axs = plt.subplots(1, batch_size, figsize=(batch_size * 5, 4))  # Adjust figure size as needed

        # Check if batch_size is 1, axs might not be iterable
        if batch_size == 1:
            axs = [axs]

        # Plot each spectral filter in its own subplot
        for i in range(batch_size):
            colors = ['b', 'g', 'r']
            for j in range(3):
                # Random pixel; dashed = reference, solid = reconstruction.
                pix_j_row_value = np.random.randint(0, y)
                pix_j_col_value = np.random.randint(0, x)

                pix_j_ref = ref_hyperspectral_cube[i, pix_j_row_value, pix_j_col_value, :].cpu().detach().numpy()
                pix_j_reconstructed = recontructed_hyperspectral_cube[i, pix_j_row_value, pix_j_col_value, :].cpu().detach().numpy()
                axs[i].plot(pix_j_reconstructed, label="pix reconstructed" + str(j), c=colors[j])
                axs[i].plot(pix_j_ref, label="pix" + str(j), linestyle='--', c=colors[j])

            axs[i].set_title(f"Reconstruction quality")

            axs[i].set_xlabel("Wavelength index")
            axs[i].set_ylabel("pix values")
            axs[i].grid(True)

        plt.legend()
        # Adjust layout
        plt.tight_layout()

        # Create a buffer to save plot
        buf = io.BytesIO()
        plt.savefig(buf, format='png')
        plt.close(fig)
        buf.seek(0)

        # Convert PNG buffer to PIL Image
        image = Image.open(buf)

        # Convert PIL Image to Tensor
        image_tensor = transforms.ToTensor()(image)
        return image_tensor


def subsample(input, origin_sampling, target_sampling):
    """Select, for each target sample position, the nearest origin channel.

    Nearest-neighbour resampling along the last (spectral) axis — no
    interpolation; ties resolve to the first (lowest) index, matching
    ``argmin`` semantics.

    Args:
        input: tensor of shape (bs, row, col, nC) sampled at `origin_sampling`.
        origin_sampling: 1-D tensor of the nC original sample positions.
        target_sampling: 1-D tensor of the desired sample positions.

    Returns:
        Tensor of shape (bs, row, col, len(target_sampling)).
    """
    # Vectorized nearest-neighbour lookup: build the |target - origin|
    # distance matrix (len(target) x nC) and take the argmin per row,
    # replacing the original per-sample Python loop.
    distances = torch.abs(target_sampling.unsqueeze(1) - origin_sampling.unsqueeze(0))
    indices = torch.argmin(distances, dim=1)
    return input[:, :, :, indices]

def expand_mask_3d(mask_batch, nb_of_channels=28):
    """Broadcast a batch of 2-D patterns to a channels-first 3-D mask.

    Args:
        mask_batch: (bs, row, col) tensor, or a 4-D tensor whose last
            dimension is 1 (already has a trailing channel axis).
        nb_of_channels: number of spectral channels to replicate the mask
            over (default 28, the value previously hard-coded).

    Returns:
        Tensor of shape (bs, nb_of_channels, row, col).
    """
    if len(mask_batch.shape) == 3:
        # Add a trailing channel axis before replicating.
        mask3d = mask_batch.unsqueeze(-1).repeat((1, 1, 1, nb_of_channels))
    else:
        mask3d = mask_batch.repeat((1, 1, 1, nb_of_channels))
    # Move channels to the front: (bs, row, col, C) -> (bs, C, row, col).
    mask3d = torch.permute(mask3d, (0, 3, 1, 2))
    return mask3d

class EmptyModule(nn.Module):
    """Identity placeholder module.

    The 1x1 linear layer exists only so the module exposes at least one
    trainable parameter (e.g. to keep an optimizer happy); it is never
    applied to the input.
    """

    def __init__(self):
        super().__init__()
        self.useless_linear = nn.Linear(1, 1)

    def forward(self, x):
        # Pure pass-through: return the input unchanged.
        return x


def pad_tensor(input_tensor, target_shape):
    """Zero-pad the last two dimensions of `input_tensor` up to `target_shape`.

    Padding is centered; when the total padding is odd, the extra row/column
    goes to the bottom/right. Dimensions already at or above the target size
    are left untouched (no cropping).

    Generalized from the original strictly-3-D version: any tensor with at
    least two dimensions is accepted, since F.pad targets the trailing dims.

    Args:
        input_tensor: tensor of shape (..., row, col).
        target_shape: (target_row, target_col) pair.

    Returns:
        Tensor of shape (..., max(row, target_row), max(col, target_col)).
    """
    row, col = input_tensor.shape[-2], input_tensor.shape[-1]
    target_row, target_col = target_shape

    # Calculate padding for rows (clamped at 0 so we never "pad negatively").
    pad_row_total = max(target_row - row, 0)
    pad_row_top = pad_row_total // 2
    pad_row_bottom = pad_row_total - pad_row_top

    # Calculate padding for columns
    pad_col_total = max(target_col - col, 0)
    pad_col_left = pad_col_total // 2
    pad_col_right = pad_col_total - pad_col_left

    # F.pad's tuple is ordered (left, right, top, bottom) over the last dims.
    padded_tensor = F.pad(input_tensor, (pad_col_left, pad_col_right, pad_row_top, pad_row_bottom), 'constant', 0)
    return padded_tensor

def crop_tensor(input_tensor, target_shape):
    """Center-crop the last two dimensions of `input_tensor` to `target_shape`.

    Generalized from the original strictly-3-D version: any tensor with at
    least two dimensions is accepted; leading dimensions are preserved.

    Args:
        input_tensor: tensor of shape (..., row, col) with row >= target_row
            and col >= target_col (behavior is undefined for smaller inputs,
            as in the original — use `pad_tensor` for that direction).
        target_shape: (target_row, target_col) pair.

    Returns:
        Tensor of shape (..., target_row, target_col).
    """
    row, col = input_tensor.shape[-2], input_tensor.shape[-1]
    target_row, target_col = target_shape
    # Symmetric crop offsets; the extra row/col (odd difference) is taken
    # from the bottom/right, mirroring pad_tensor's convention.
    crop_row = (row - target_row) // 2
    crop_col = (col - target_col) // 2
    return input_tensor[..., crop_row:crop_row + target_row, crop_col:crop_col + target_col]

# img = torch.randn(3, 112, 112) # Example tensor
# target_height = 128
# target_width = 128
#
# plt.imshow(img[0,...].cpu().detach().numpy())
# plt.show()
#
# zda = pad_tensor(img, (target_height, target_width))
#
# plt.imshow(zda[0,...].cpu().detach().numpy())
# plt.show()


class BinarizeFunction(torch.autograd.Function):
    """Hard 0/1 threshold at 0.5 with a straight-through gradient estimator."""

    @staticmethod
    def forward(ctx, input):
        # Strictly-greater comparison: values above 0.5 map to 1.0,
        # everything else (including exactly 0.5) maps to 0.0.
        return torch.gt(input, 0.5).float()

    @staticmethod
    def backward(ctx, grad_output):
        # Straight-through estimator: the true gradient of a step function
        # is zero almost everywhere, so pass the upstream gradient through
        # unchanged to keep the mask generator trainable.
        return grad_output
Loading

0 comments on commit 71cf609

Please sign in to comment.