Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
59 commits
Select commit Hold shift + click to select a range
acb48e2
Distributed rcdm
sanaAyrml Jan 24, 2024
cdec0c9
Add rcdm model
sanaAyrml Jan 25, 2024
23cdf80
Add checkpointing
sanaAyrml Jan 26, 2024
ae42737
update
sanaAyrml Jan 26, 2024
73c580b
update
sanaAyrml Jan 26, 2024
25936dc
update config
sanaAyrml Jan 26, 2024
2d9d197
edit logging
sanaAyrml Jan 26, 2024
422a10d
server
sanaAyrml Jan 30, 2024
60d3dc3
add checkpointing
sanaAyrml Jan 30, 2024
9ae6ee8
Add eval files
sanaAyrml Feb 1, 2024
642ad8a
add slrm file
sanaAyrml Feb 1, 2024
ea7cc42
update eval file
sanaAyrml Feb 1, 2024
a9cbba1
update eval
sanaAyrml Feb 1, 2024
90ea717
check eval
sanaAyrml Feb 1, 2024
1cba4c8
check
sanaAyrml Feb 1, 2024
6a34a85
check state_dicts
sanaAyrml Feb 1, 2024
86dcdf7
check
sanaAyrml Feb 1, 2024
4e683a4
edit eval classes
sanaAyrml Feb 1, 2024
ecfab47
check
sanaAyrml Feb 1, 2024
20795af
update slrm
sanaAyrml Feb 1, 2024
38a86e6
Update eval
sanaAyrml Feb 1, 2024
d85de17
edit
sanaAyrml Feb 1, 2024
e359965
edit slrm
sanaAyrml Feb 1, 2024
c78abd0
correct sample slrm
sanaAyrml Feb 1, 2024
a1fa4ea
fix multi gpu
sanaAyrml Feb 1, 2024
fc054cb
Merge branch 'main' into add_simclr_eval
sanaAyrml Feb 12, 2024
f96c121
Delete pytest
sanaAyrml Feb 12, 2024
73eb9e4
update eval
sanaAyrml Feb 13, 2024
e67b598
clean code
sanaAyrml Feb 13, 2024
56688ca
clean code
sanaAyrml Feb 13, 2024
084d05c
clean code
sanaAyrml Feb 13, 2024
1b9ccf3
clean code
sanaAyrml Feb 13, 2024
c707014
clean code
sanaAyrml Feb 13, 2024
b36c694
debug rcdm error
sanaAyrml Feb 13, 2024
cf9713d
edit
sanaAyrml Feb 13, 2024
f8e8eb1
edit
sanaAyrml Feb 13, 2024
5755923
delete normalize
sanaAyrml Feb 13, 2024
25d250f
edit
sanaAyrml Feb 13, 2024
5754ae1
delete print
sanaAyrml Feb 13, 2024
509530f
Merge branch 'main' into add_simclr_eval
sanaAyrml Feb 16, 2024
0642905
update evaluation
sanaAyrml Feb 20, 2024
245eb54
update formatting
sanaAyrml Feb 20, 2024
33c0c93
update logging
sanaAyrml Feb 23, 2024
31409dd
Update bash files
sanaAyrml Feb 23, 2024
eb9a4b6
Update augmentation and saving file
sanaAyrml Feb 23, 2024
288f749
update evaluation
sanaAyrml Feb 23, 2024
3b43d4e
Update bash file
sanaAyrml Feb 23, 2024
e64fe5c
edit eval
sanaAyrml Feb 23, 2024
ef6a214
check loading
sanaAyrml Feb 23, 2024
cef4572
debug eval
sanaAyrml Feb 23, 2024
883d9c0
update
sanaAyrml Feb 23, 2024
c900b9f
check evaluation
sanaAyrml Feb 23, 2024
314633c
Clean the code
sanaAyrml Feb 23, 2024
ed78e17
update
sanaAyrml Feb 23, 2024
a392667
try catch the file exist error
sanaAyrml Feb 23, 2024
6c5cf20
update
sanaAyrml Feb 23, 2024
313b705
update logging part
sanaAyrml Feb 23, 2024
67b5a9f
update slrm scripts
sanaAyrml Feb 25, 2024
1e2ba81
update resnet pretrained
sanaAyrml Feb 28, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 0 additions & 9 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -40,15 +40,6 @@ repos:
- id: nbqa-ruff
args: [--fix]

- repo: local
hooks:
- id: pytest
name: pytest
entry: python3 -m pytest
language: system
pass_filenames: false
always_run: true

exclude: |
(?x)(
^rcdm/|
Expand Down
Original file line number Diff line number Diff line change
@@ -1,11 +1,11 @@
from torchvision import datasets, transforms

from SimCLR.data_aug.gaussian_blur import GaussianBlur
from SimCLR.data_aug.icgan_aug import ICGANInference
from SimCLR.data_aug.icgan_config import get_icgan_config
from SimCLR.data_aug.rcdm_aug import RCDMInference
from SimCLR.data_aug.rcdm_config import get_config
from SimCLR.data_aug.view_generator import ContrastiveLearningViewGenerator
from SimCLR.datasets.data_aug.gaussian_blur import GaussianBlur
from SimCLR.datasets.data_aug.icgan_aug import ICGANInference
from SimCLR.datasets.data_aug.icgan_config import get_icgan_config
from SimCLR.datasets.data_aug.rcdm_aug import RCDMInference
from SimCLR.datasets.data_aug.rcdm_config import get_config
from SimCLR.datasets.view_generator import ContrastiveLearningViewGenerator
from SimCLR.exceptions.exceptions import InvalidDatasetSelection


Expand Down Expand Up @@ -114,3 +114,4 @@ def get_dataset(
raise InvalidDatasetSelection()
else:
return dataset_fn()

44 changes: 44 additions & 0 deletions SimCLR/datasets/data_aug/center_crop.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,44 @@
import torch.nn.functional as F
import torchvision
import torch

class CostumeCenterCrop(torch.nn.Module):
    """Center-crop an image either to a fixed size or to a target aspect ratio.

    When ``size`` is given, this behaves like a plain center crop to that size.
    When ``size`` is None, the crop size is derived from ``ratio`` (a
    ``"W:H"``-style string) so that the crop reaches the edge of the image.
    """

    def __init__(self, size=None, ratio="1:1"):
        super().__init__()
        self.size = size
        self.ratio = ratio

    def forward(self, img):
        """
        Args:
            img (PIL Image or Tensor): Image to be cropped.

        Returns:
            PIL Image or Tensor: Cropped image.
        """
        target = self.size if self.size is not None else self._ratio_size(img)
        return torchvision.transforms.functional.center_crop(img, target)

    def _ratio_size(self, img):
        """Compute the largest (h, w) crop matching ``self.ratio`` for ``img``."""
        # Tensors are (..., H, W); PIL images report (W, H) via .size.
        if isinstance(img, torch.Tensor):
            height, width = img.shape[-2:]
        else:
            width, height = img.size
        num, den = self.ratio.split(":")
        aspect = float(num) / float(den)
        # Candidate sizes that match the ratio while touching an image edge.
        cropped_w = int(height * aspect)
        cropped_h = int(width / aspect)
        if width >= height:
            return (cropped_h, width) if cropped_h <= height else (height, cropped_w)
        return (height, cropped_w) if cropped_w <= width else (cropped_h, width)

    def __repr__(self) -> str:
        return f"{self.__class__.__name__}(size={self.size})"

File renamed without changes.
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ def __init__(self, config, device_id):

# Load SSL model
self.ssl_model = (
get_model(self.config.type_model, self.config.use_head)
get_model(self.config.type_model, self.config.use_head, self.config.pretrained_models_dir)
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Can you explain this change? Why wasn't this passed before?

.cuda(self.device_id)
.eval()
)
Expand Down Expand Up @@ -50,7 +50,7 @@ def __init__(self, config, device_id):

if self.config.model_path == "":
trained_model = get_dict_rcdm_model(
self.config.type_model, self.config.use_head
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

same here

self.config.type_model, self.config.use_head, self.config.pretrained_models_dir
)
else:
trained_model = torch.load(self.config.model_path, map_location="cpu")
Expand All @@ -63,7 +63,6 @@ def preprocess_input_image(self, input_image, size=224):
data_utils.CenterCropLongEdge(),
transforms.Resize((size, size)),
transforms.ToTensor(),
transforms.Normalize(self.config.norm_mean, self.config.norm_std),
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why did you remove this? Is it causing an error?

]
)
tensor_image = transform_list(input_image)
Expand All @@ -89,9 +88,8 @@ def __call__(self, img):
if not self.config.use_ddim
else self.diffusion.ddim_sample_loop
)

img = img.unsqueeze(0).repeat(1, 1, 1, 1)
img = self.preprocess_input_image(img).cuda(self.device_id)
img = img.repeat(1, 1, 1, 1)
model_kwargs = {}

with torch.no_grad():
Expand All @@ -104,5 +102,4 @@ def __call__(self, img):
model_kwargs=model_kwargs,
)

print("Sampling completed!")
return sample.squeeze(0)
Original file line number Diff line number Diff line change
@@ -1,29 +1,31 @@
import ml_collections


def get_config():
    """Build and return the default RCDM sampling/model configuration.

    Returns:
        ml_collections.ConfigDict: Hyper-parameters for diffusion sampling and
        for the SSL model whose representations condition the generation.
    """
    config = ml_collections.ConfigDict()
    config.image_size = 128  # The size of the images to generate.
    config.class_cond = False  # If true, use class conditional generation.
    config.type_model = "simclr"  # Type of model to use (e.g., simclr, dino).
    config.use_head = False  # If true, use the projector/head for SSL representation.
    config.model_path = ""  # Replace with the path to your model if you have one.
    config.use_ddim = False  # If true, use DDIM sampler.
    config.no_shared = True  # If false, enables squeeze and excitation.
    config.clip_denoised = True  # If true, clip denoised images.
    config.attention_resolutions = "32,16,8"  # Resolutions to use for attention layers.
    config.diffusion_steps = 100  # Number of diffusion steps.
    config.learn_sigma = True  # If true, learn the noise level.
    config.noise_schedule = "linear"  # Type of noise schedule (e.g., linear).
    config.num_channels = 256  # Number of channels in the model.
    config.num_heads = 4  # Number of attention heads.
    config.num_res_blocks = 2  # Number of residual blocks.
    config.resblock_updown = True  # If true, use up/down sampling in resblocks.
    config.use_fp16 = False  # If true, use 16-bit floating point precision.
    config.use_scale_shift_norm = True  # If true, use scale-shift normalization.
    config.ssl_image_size = 224  # Size of the input images for the SSL model.
    config.ssl_image_channels = (
        3  # Number of channels of the input images for the SSL model.
    )

    return config
import ml_collections


def get_config():
    """Build and return the default RCDM sampling/model configuration.

    Returns:
        ml_collections.ConfigDict: Hyper-parameters for diffusion sampling and
        for the SSL model whose representations condition the generation.
    """
    settings = {
        "image_size": 128,  # The size of the images to generate.
        "class_cond": False,  # If true, use class conditional generation.
        "pretrained_models_dir": "/ssd003/projects/aieng/genssl",  # Path to the directory containing the model.
        "type_model": "simclr",  # Type of model to use (e.g., simclr, dino).
        "use_head": False,  # If true, use the projector/head for SSL representation.
        "model_path": "",  # Replace with the path to your model if you have one.
        "use_ddim": True,  # If true, use DDIM sampler.
        "no_shared": True,  # If false, enables squeeze and excitation.
        "clip_denoised": True,  # If true, clip denoised images.
        "attention_resolutions": "32,16,8",  # Resolutions to use for attention layers.
        "diffusion_steps": 100,  # Number of diffusion steps.
        "learn_sigma": True,  # If true, learn the noise level.
        "noise_schedule": "linear",  # Type of noise schedule (e.g., linear).
        "num_channels": 256,  # Number of channels in the model.
        "num_heads": 4,  # Number of attention heads.
        "num_res_blocks": 2,  # Number of residual blocks.
        "resblock_updown": True,  # If true, use up/down sampling in resblocks.
        "use_fp16": False,  # If true, use 16-bit floating point precision.
        "use_scale_shift_norm": True,  # If true, use scale-shift normalization.
        "ssl_image_size": 224,  # Size of the input images for the SSL model.
        "ssl_image_channels": 3,  # Number of channels of the input images for the SSL model.
        "timestep_respacing": "ddim2",  # Type of timestep respacing (e.g., ddim25).
    }
    return ml_collections.ConfigDict(settings)
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Update config to available ddim.

57 changes: 57 additions & 0 deletions SimCLR/datasets/supervised_dataset.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,57 @@
from torchvision import datasets, transforms
from torchvision.transforms import transforms
Comment on lines +1 to +2
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

These lines both import transforms which could cause confusion. Is one of them unnecessary and can be removed?


from SimCLR.exceptions.exceptions import InvalidDatasetSelection
from SimCLR.datasets.data_aug.center_crop import CostumeCenterCrop
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Should we change this? (see the comment on the module)


class SupervisedDataset:
    """Factory for torchvision datasets wrapped with simple supervised transforms.

    Attributes:
        root_folder (str): Directory where datasets are stored / downloaded.
    """

    # Per-dataset input resolution, kept in one place instead of inline
    # magic numbers (reviewer request: make these constants configurable).
    IMAGE_SIZES = {"imagenet": 224, "cifar10": 32, "stl10": 96}

    def __init__(self, root_folder):
        self.root_folder = root_folder

    @staticmethod
    def get_transform(size):
        """Return a set of simple transformations for supervised learning.

        Args:
            size (int): Image size.
        """
        transform_list = [
            CostumeCenterCrop(),
            transforms.Resize((size, size)),
            transforms.ToTensor(),
        ]
        return transforms.Compose(transform_list)

    def get_dataset(self, name, train=True):
        """Return the requested dataset with the standard transform applied.

        Args:
            name (str): One of "imagenet", "cifar10" or "stl10".
            train (bool): If True use the training split, otherwise the
                evaluation split ("val" for ImageNet, "test" for STL10).

        Raises:
            InvalidDatasetSelection: If ``name`` is not a supported dataset.
        """
        if name == "imagenet":
            # ImageNet is assumed to already exist on disk (no download flag).
            return datasets.ImageNet(
                self.root_folder,
                split="train" if train else "val",
                transform=self.get_transform(self.IMAGE_SIZES[name]),
            )
        elif name == "cifar10":
            return datasets.CIFAR10(
                self.root_folder,
                train=train,
                transform=self.get_transform(self.IMAGE_SIZES[name]),
                download=True,
            )
        elif name == "stl10":
            return datasets.STL10(
                self.root_folder,
                split="train" if train else "test",
                transform=self.get_transform(self.IMAGE_SIZES[name]),
                download=True,
            )
        else:
            raise InvalidDatasetSelection()
File renamed without changes.
64 changes: 64 additions & 0 deletions SimCLR/models/resnet_pretrained.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,64 @@
import torch
from torch import nn
from torchvision import models

from ..exceptions.exceptions import InvalidBackboneError
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Please use absolute paths.



class PretrainedResNet(nn.Module):
    """ResNet backbone initialized from a SimCLR pretraining checkpoint.

    Loads backbone weights (everything except the final ``fc`` layer) from
    ``pretrained_model_file`` and, when ``linear_eval`` is True, freezes the
    backbone so only the classification head is trainable.
    """

    def __init__(self, base_model, pretrained_model_file, linear_eval=True, num_classes=10):
        super().__init__()

        self.pretrained_model_file = pretrained_model_file

        # Map names to factories so only the requested architecture is built.
        # (Previously both resnet18 and resnet50 were instantiated eagerly,
        # wasting time and memory for the model that was never used.)
        self.resnet_dict = {
            "resnet18": lambda: models.resnet18(pretrained=False, num_classes=num_classes),
            "resnet50": lambda: models.resnet50(pretrained=False, num_classes=num_classes),
        }

        self.backbone = self._get_basemodel(base_model)

        # Load pretrained weights; only the freshly-initialized fc head
        # is allowed to be absent from the checkpoint.
        log = self._load_pretrained()
        assert log.missing_keys == ["fc.weight", "fc.bias"]

        if linear_eval:
            # Freeze all layers but the last fc.
            self._freeze_backbone()
            parameters = [p for p in self.backbone.parameters() if p.requires_grad]
            assert len(parameters) == 2  # fc.weight, fc.bias

    def _load_pretrained(self):
        """Load backbone weights from the checkpoint, stripping the DDP prefix."""
        checkpoint = torch.load(self.pretrained_model_file, map_location="cpu")
        state_dict = checkpoint["state_dict"]
        for k in list(state_dict.keys()):
            if k.startswith("module.backbone."):
                if not k.startswith("module.backbone.fc"):
                    # Remove the "module.backbone." prefix added by DDP training.
                    state_dict[k[len("module.backbone.") :]] = state_dict[k]
                del state_dict[k]
        # strict=False: the fc head is newly initialized, not in the checkpoint.
        return self.backbone.load_state_dict(state_dict, strict=False)

    def _freeze_backbone(self):
        """Freeze all layers but the last fc."""
        for name, param in self.backbone.named_parameters():
            if name not in ["fc.weight", "fc.bias"]:
                param.requires_grad = False

    def _get_basemodel(self, model_name):
        """Instantiate the requested backbone, raising on unknown names."""
        try:
            return self.resnet_dict[model_name]()
        except KeyError as err:
            # Chain the original KeyError for easier debugging.
            raise InvalidBackboneError(
                "Invalid backbone architecture. Check the config file and pass one of: resnet18 or resnet50",
            ) from err

    def forward(self, x):
        return self.backbone(x)
12 changes: 10 additions & 2 deletions SimCLR/simclr.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
import os
from datetime import datetime

import torch
from torch.cuda.amp import GradScaler, autocast
Expand All @@ -18,7 +19,15 @@ def __init__(self, *args, **kwargs):
self.optimizer = kwargs["optimizer"]
self.scheduler = kwargs["scheduler"]
self.device_id = kwargs["device_id"]
self.writer = SummaryWriter()
# Create a directory to save the model checkpoints and logs
now = datetime.now()
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I have added logic to run_simCLR.py that does something like this. So you have to either remove these parts, or remove my changes before merging.

dt_string = now.strftime("%Y_%m_%d_%H_%M")
log_dir = os.path.join(args.model_dir, args.experiment_name,dt_string)
try:
os.makedirs(log_dir)
except FileExistsError:
print(f"Directory {log_dir} made by another worker", flush=True)
self.writer = SummaryWriter(log_dir)
self.criterion = loss.SimCLRContrastiveLoss(self.args.temperature).cuda(
self.device_id
)
Expand Down Expand Up @@ -62,7 +71,6 @@ def train(self, train_loader):
self.scheduler.get_last_lr()[0],
global_step=n_iter,
)

n_iter += 1

# warmup for the first 10 epochs
Expand Down
51 changes: 51 additions & 0 deletions eval_simclr.slrm
Original file line number Diff line number Diff line change
@@ -0,0 +1,51 @@
#!/bin/bash
# Evaluate every SimCLR checkpoint of an experiment with linear evaluation,
# one distributed srun launch per checkpoint file.

#SBATCH --job-name=eval_simclr
#SBATCH --partition=t4v2
#SBATCH --nodes=1
#SBATCH --gres=gpu:4
#SBATCH --ntasks-per-node=4
#SBATCH --cpus-per-task=4
#SBATCH --mem=100G
#SBATCH --output=logs/simclr/eval_slurm-%N-%j.out
#SBATCH --error=logs/simclr/eval_slurm-%N-%j.err
#SBATCH --qos=m

PY_ARGS=${@:1}

# load virtual environment
source /ssd003/projects/aieng/envs/genssl2/bin/activate

export TORCH_NCCL_ASYNC_ERROR_HANDLING=1 # set to 1 for NCCL backend
export CUDA_LAUNCH_BLOCKING=1

export MASTER_ADDR=$(hostname)
export MASTER_PORT=45679

export PYTHONPATH="."
nvidia-smi

pretrained_model_dir="/projects/imagenet_synthetic/train_models"
experiment_name="simclr/2024_02_23_13_02"

# Loop over each checkpoint and pass it to the evaluation script.
# A quoted glob is used instead of parsing `ls` output (and the cd/$OLDPWD
# round-trip), which is fragile with unusual filenames.
for checkpoint in "$pretrained_model_dir/$experiment_name"/checkpoint_epoch_*
do
    file=$(basename "$checkpoint")
    echo "Evaluating: $file"

    # srun execute ntasks-per-node * nodes times
    srun python evaluate_simCLR.py \
        --distributed_mode \
        --batch-size=256 \
        --pretrained_model_dir=$pretrained_model_dir \
        --experiment_name=$experiment_name \
        --pretrained_model_name=$file \
        --linear_evaluation
done
Loading