Add files via upload

AlbertoFormaggio1 · web-flow · commit 446965ea97c3 · 2024-01-17T18:46:15.000+01:00
diff --git a/load_ds_histogram.py b/load_ds_histogram.py
@@ -0,0 +1,100 @@
+import torch
+import torchvision
+import torchvision.datasets as datasets
+from torchvision.transforms import v2
+from torch.utils.data import DataLoader
+from torchvision.datasets.folder import default_loader
+import cv2
+import numpy as np
+import os
+
+# Default number of DataLoader worker processes. os.cpu_count() may return
+# None when the CPU count cannot be determined; fall back to 0 (load data in
+# the main process) so the DataLoader always receives an int.
+NUM_WORKERS = os.cpu_count() or 0
+
+def create_dataloaders(train_path: str,
+                       test_path: str,
+                       batch_size: int,
+                       pre_proc_type: str,
+                       num_workers: int = NUM_WORKERS):
+    """
+    Builds the train and test dataloaders over histogram features.
+
+    Args:
+        train_path: root folder of the training images (ImageFolder layout).
+        test_path: root folder of the test images (ImageFolder layout).
+        batch_size: number of samples per batch for both loaders.
+        pre_proc_type: preprocessing type forwarded to HistogramDataset.
+        num_workers: number of worker processes used by both loaders.
+
+    Returns:
+        tuple: (train dataloader, test dataloader, `classes` attribute of the
+        training dataset).
+    """
+    training_set = HistogramDataset(train_path, pre_proc_type)
+    evaluation_set = HistogramDataset(test_path, pre_proc_type)
+
+    # Options common to both loaders; only the shuffling differs.
+    shared_options = dict(batch_size=batch_size,
+                          num_workers=num_workers,
+                          pin_memory=True,
+                          drop_last=False)
+
+    train_loader = DataLoader(training_set, shuffle=True, **shared_options)
+    test_loader = DataLoader(evaluation_set, shuffle=False, **shared_options)
+
+    return train_loader, test_loader, training_set.classes
+
+
+class HistogramDataset(torchvision.datasets.ImageFolder):
+    """
+    ImageFolder dataset whose samples are colour-histogram features.
+
+    Each image is read with OpenCV, smoothed with a 3x3 Gaussian blur,
+    optionally converted to Lab, reduced to one histogram per channel by
+    calc_hists, L2-normalised and converted to a tensor.
+
+    Args:
+        root: root directory in ImageFolder layout (one sub-folder per class).
+        preproc_type: 'lab' or 'rgb'; colour space the histograms are computed in.
+        loader: forwarded to ImageFolder. Note that __getitem__ reads the files
+            with cv2.imread and does not call this loader.
+        is_valid_file: forwarded to ImageFolder.
+
+    Raises:
+        ValueError: if preproc_type is neither 'lab' nor 'rgb'.
+    """
+
+    def __init__(self, root, preproc_type, loader=default_loader, is_valid_file=None):
+        # Fail fast: an unsupported type used to make __getitem__ return None.
+        if preproc_type not in ('lab', 'rgb'):
+            raise ValueError(
+                f"Unsupported preproc_type {preproc_type!r}: expected 'lab' or 'rgb'")
+        super(HistogramDataset, self).__init__(root=root, loader=loader, is_valid_file=is_valid_file)
+        self.pre_proc_type = preproc_type
+
+    def __getitem__(self, index):
+        """Returns (histogram tensor, class index) for the sample at `index`."""
+        image_path, target = self.samples[index]
+        im = cv2.imread(image_path)
+        # cv2.imread signals failure by returning None instead of raising.
+        if im is None:
+            raise OSError(f"Could not read image file: {image_path}")
+
+        im_nonoise = cv2.GaussianBlur(im, (3, 3), 1)
+        if self.pre_proc_type == 'lab':
+            # Scale to [0, 1] float32 before the BGR -> Lab conversion.
+            prep_image = (im_nonoise * 1. / 255).astype(np.float32)
+            hist_input = cv2.cvtColor(prep_image, cv2.COLOR_BGR2LAB)
+        else:
+            # 'rgb': histogram the blurred BGR image directly. (Previously this
+            # path referenced a variable that was only assigned for 'lab'.)
+            hist_input = im_nonoise
+        hist = calc_hists(hist_input, self.pre_proc_type)
+
+        # Stack the per-channel histograms along a new last axis and drop
+        # singleton dimensions (expected to give a bins x 3 matrix; the
+        # trainer sizes the MLP input as 16 * 3).
+        hist = np.squeeze(np.stack(hist, axis=-1))
+
+        # L2 normalisation; skip the division for an all-zero histogram so
+        # the features never become NaN.
+        norm = np.linalg.norm(hist)
+        norm_hist = hist / norm if norm > 0 else hist
+
+        # Convert the numpy matrix to a torch tensor.
+        sample = torchvision.transforms.ToTensor()(norm_hist)
+        return sample, target
+
+
+# Compute one histogram per channel of a 3-channel image.
+def calc_hists(img: np.ndarray, hist_type, bins: int = 16) -> list:
+    """
+    Calculates the histogram of the image (channel by channel).
+
+    Args:
+        img (numpy.ndarray): image of shape (Height, Width, Channels); the
+            first three channels are histogrammed. The value ranges assume
+            8-bit data for 'rgb' and float Lab data for 'lab'
+            (NOTE(review): confirm against the caller's preprocessing).
+        hist_type (str): 'rgb' or 'lab'; selects the per-channel value ranges.
+        bins (int): number of bins of each channel histogram (default 16).
+
+    Returns:
+        list: three histograms in channel order 0, 1, 2 (i.e. blue, green,
+        red for a BGR image as loaded by OpenCV; L, a, b for 'lab').
+
+    Raises:
+        ValueError: if img is not 3-dimensional or hist_type is unsupported.
+    """
+
+    # Explicit check instead of assert, which is stripped under `python -O`.
+    if img.ndim != 3:
+        raise ValueError("The image must have 3 dimensions: (Height,Width,Channels)")
+
+    # Per-channel value ranges. The upper bound is exclusive, so [0, 256]
+    # covers the values 0..255.
+    # https://docs.opencv.org/3.4/d8/dbc/tutorial_histogram_calculation.html
+    if hist_type == 'rgb':
+        ranges = ([0, 256], [0, 256], [0, 256])
+    elif hist_type == 'lab':
+        # L, a, b ranges. Values equal to an upper bound are not counted.
+        ranges = ([0, 100], [-128, 128], [-128, 128])
+    else:
+        raise ValueError(f"Unsupported hist_type {hist_type!r}: expected 'rgb' or 'lab'")
+
+    # Selecting the channel by index keeps the output in channel order; the
+    # previous 'rgb' code swapped the green and red histograms.
+    return [cv2.calcHist([img], [channel], None, [bins], value_range)
+            for channel, value_range in enumerate(ranges)]
+
+
diff --git a/model_mlp.py b/model_mlp.py
@@ -0,0 +1,15 @@
+import torch
+from torch import nn
+
+class MLP(torch.nn.Module):
+    """
+    Multi-layer perceptron with a single hidden layer: Linear -> ReLU -> Linear.
+
+    Args:
+        in_feature: number of input features per sample after flattening.
+        hidden_size: number of units in the hidden layer.
+        num_classes: number of output units (one score per class).
+    """
+
+    def __init__(self, in_feature, hidden_size, num_classes):
+        super().__init__()
+        self.layer_1 = nn.Linear(in_feature, hidden_size)
+        self.layer_2 = nn.Linear(hidden_size, num_classes)
+
+    def forward(self, x):
+        """Flattens every dimension after the first and returns the output scores."""
+        flat = torch.flatten(x, start_dim=1)
+        hidden = torch.relu(self.layer_1(flat))
+        return self.layer_2(hidden)
diff --git a/trainer_hist.py b/trainer_hist.py
@@ -0,0 +1,79 @@
+import torch, torchvision
+from torch import nn
+from torchvision import transforms
+import matplotlib.pyplot as plt
+import evaluate
+from torch.utils.tensorboard import SummaryWriter
+import engine
+import load_ds_histogram, model_mlp
+import os
+import re
+from pathlib import Path
+import warnings
+import argparse
+import datetime
+
+# Silence every warning for the whole process.
+warnings.filterwarnings("ignore")
+
+
+def _str2bool(value):
+    """
+    Parses a command-line boolean.
+
+    argparse's `type=bool` calls bool() on the raw string, so any non-empty
+    value (including "False") becomes True. This helper maps the usual
+    spellings explicitly; the empty string stays False, as it was with bool().
+
+    Raises:
+        argparse.ArgumentTypeError: if the value is not a recognised boolean.
+    """
+    if isinstance(value, bool):
+        return value
+    lowered = value.strip().lower()
+    if lowered in ('true', 't', 'yes', 'y', '1'):
+        return True
+    if lowered in ('false', 'f', 'no', 'n', '0', ''):
+        return False
+    raise argparse.ArgumentTypeError(f"Expected a boolean value, got {value!r}")
+
+
+parser = argparse.ArgumentParser()
+# These arguments will be set appropriately by ReCodEx, even if you change them.
+parser.add_argument("--batch_size", default=16, type=int, help="Batch size.")
+parser.add_argument('--epochs', default=30, type=int, help="Epochs.")
+parser.add_argument('--learning_rate', default=0.1, type=float, help="Learning rate.")
+parser.add_argument('--label_smoothing', default=0.1, type=float, help='Label smoothing.')
+parser.add_argument('--preproc_type', default='lab', type=str, choices=['lab', 'rgb'], help='Type of preprocessing')
+parser.add_argument('--hidden_size', default=32, type=int, help='Number of hidden neurons in the MLP')
+parser.add_argument('--only_inference', default=True, type=_str2bool, help='If true, skip training and only load the saved model and evaluate it.')
+
+def main(args: argparse.Namespace):
+    """
+    Trains (optionally) an MLP on the 'syndrone' histograms and tests it on 'UAVid'.
+
+    Steps: build a log directory name from the script name, a timestamp and
+    the abbreviated arguments; create the 'syndrone' dataloaders and the MLP;
+    train unless `args.only_inference` is set; load `model.pth` from the log
+    directory; evaluate on the 'UAVid' test split and log every returned
+    metric to TensorBoard under `test/<name>`.
+
+    Args:
+        args: parsed command-line arguments; `args.logdir` is set here.
+    """
+    # Argument names are abbreviated to the initials of their
+    # underscore-separated parts (e.g. batch_size -> bs).
+    args.logdir = os.path.join("logs", "{}-{}-{}".format(
+        os.path.basename(globals().get("__file__", "notebook")),
+        datetime.datetime.now().strftime("%Y-%m-%d_%H%M%S"),
+        ",".join(("{}={}".format(re.sub("(.)[^_]*_?", r"\1", k), v) for k, v in sorted(vars(args).items())))
+    ))
+
+    device = 'cuda' if torch.cuda.is_available() else 'cpu'
+
+    data_path = Path('syndrone')
+    train_path = data_path / 'train'
+    test_path = data_path / 'test'
+
+    train_dataloader, test_dataloader, classes = load_ds_histogram.create_dataloaders(train_path, test_path, args.batch_size, args.preproc_type)
+
+    # Input size: 16 histogram bins for each of the 3 channels.
+    # NOTE(review): the model is not moved to `device` here; presumably the
+    # engine functions do that - confirm.
+    mlp = model_mlp.MLP(16 * 3, args.hidden_size, len(classes))
+
+    loss_fn = nn.CrossEntropyLoss(label_smoothing=args.label_smoothing)
+    optimizer = torch.optim.SGD(mlp.parameters(), lr=args.learning_rate)
+
+    writer = SummaryWriter(log_dir=args.logdir)
+    # Close the writer on every exit path so pending events are flushed.
+    try:
+        # Generate the metrics
+        clf_metrics = {'precision': evaluate.load("precision"),
+                       'recall': evaluate.load("recall"),
+                       'f1': evaluate.load("f1"),
+                       'accuracy': evaluate.load("accuracy")}
+
+        if not args.only_inference:
+            engine.train(mlp, train_dataloader, test_dataloader, optimizer, loss_fn, args.epochs, device, clf_metrics, 0, writer, 'mlp',args.logdir)
+
+        # NOTE(review): args.logdir is a fresh timestamped directory, so in
+        # inference-only mode model.pth will not exist there unless it is
+        # placed manually; presumably engine.train saves it - confirm.
+        # map_location lets a checkpoint saved on GPU load on a CPU-only host.
+        mlp.load_state_dict(torch.load(f'{args.logdir}/model.pth', map_location=device))
+
+        # Now test on UAVid
+        data_path = Path('UAVid')
+        train_path = data_path / 'train'
+        test_path = data_path / 'test'
+
+        train_dataloader, test_dataloader, classes = load_ds_histogram.create_dataloaders(train_path, test_path, args.batch_size, args.preproc_type)
+
+        results = engine.test_step(mlp, test_dataloader, loss_fn, device, clf_metrics)
+
+        for k, v in results.items():
+            writer.add_scalar(f'test/{k}', v, 1)
+    finally:
+        writer.close()
+
+
+if __name__ == "__main__":
+    # When `__file__` is not defined (e.g. in a notebook), parse an empty
+    # argument list instead of the process arguments.
+    _cli_argv = None if "__file__" in globals() else []
+    args = parser.parse_args(_cli_argv)
+    main(args)