implement dataset for classification

Duftata · Duftata · commit 0684b69ac566 · 2024-10-15T10:02:40.000+02:00
diff --git a/dataset/create_cv_splits.ipynb b/dataset/create_cv_splits.ipynb
@@ -6,8 +6,8 @@
    "metadata": {
     "collapsed": true,
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:43.618315Z",
-     "start_time": "2024-10-14T16:42:43.563966Z"
+     "end_time": "2024-10-15T06:54:10.123002Z",
+     "start_time": "2024-10-15T06:54:10.078224Z"
     }
    },
    "source": [
@@ -25,8 +25,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:43.633543Z",
-     "start_time": "2024-10-14T16:42:43.619411Z"
+     "end_time": "2024-10-15T06:54:10.138779Z",
+     "start_time": "2024-10-15T06:54:10.123985Z"
     }
    },
    "cell_type": "code",
@@ -74,8 +74,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:43.644170Z",
-     "start_time": "2024-10-14T16:42:43.634252Z"
+     "end_time": "2024-10-15T06:54:10.146829Z",
+     "start_time": "2024-10-15T06:54:10.139469Z"
     }
    },
    "cell_type": "code",
@@ -116,8 +116,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:43.653869Z",
-     "start_time": "2024-10-14T16:42:43.645037Z"
+     "end_time": "2024-10-15T06:54:10.168041Z",
+     "start_time": "2024-10-15T06:54:10.147523Z"
     }
    },
    "cell_type": "code",
@@ -137,8 +137,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.314722Z",
-     "start_time": "2024-10-14T16:42:43.654562Z"
+     "end_time": "2024-10-15T06:54:10.837962Z",
+     "start_time": "2024-10-15T06:54:10.169054Z"
     }
    },
    "cell_type": "code",
@@ -156,8 +156,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.320170Z",
-     "start_time": "2024-10-14T16:42:44.315638Z"
+     "end_time": "2024-10-15T06:54:10.842454Z",
+     "start_time": "2024-10-15T06:54:10.838968Z"
     }
    },
    "cell_type": "code",
@@ -181,8 +181,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.353884Z",
-     "start_time": "2024-10-14T16:42:44.320776Z"
+     "end_time": "2024-10-15T06:54:10.876290Z",
+     "start_time": "2024-10-15T06:54:10.843525Z"
     }
    },
    "cell_type": "code",
@@ -217,8 +217,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.358482Z",
-     "start_time": "2024-10-14T16:42:44.354677Z"
+     "end_time": "2024-10-15T06:54:10.881895Z",
+     "start_time": "2024-10-15T06:54:10.877157Z"
     }
    },
    "cell_type": "code",
@@ -253,8 +253,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.549793Z",
-     "start_time": "2024-10-14T16:42:44.359164Z"
+     "end_time": "2024-10-15T06:54:11.074822Z",
+     "start_time": "2024-10-15T06:54:10.883094Z"
     }
    },
    "cell_type": "code",
@@ -291,8 +291,8 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.560169Z",
-     "start_time": "2024-10-14T16:42:44.550715Z"
+     "end_time": "2024-10-15T06:54:11.090284Z",
+     "start_time": "2024-10-15T06:54:11.076120Z"
     }
    },
    "cell_type": "code",
@@ -447,23 +447,22 @@
   {
    "metadata": {
     "ExecuteTime": {
-     "end_time": "2024-10-14T16:42:44.633875Z",
-     "start_time": "2024-10-14T16:42:44.560756Z"
+     "end_time": "2024-10-15T06:54:11.156047Z",
+     "start_time": "2024-10-15T06:54:11.091264Z"
     }
    },
    "cell_type": "code",
    "source": [
-    "print('Known classes:', df_exploded['ao_classification'].unique())\n",
-    "df_split.to_csv('/home/ron/Documents/AOClassification/data/dataset_cv_splits.csv', index=False)"
+    "print('Known classes:', sorted(df_exploded['ao_classification'].unique()))\n",
+    "df_split.to_csv('/home/ron/Documents/AOClassification/data/dataset_cv_splits.csv', index=False, mode='x')"
    ],
    "id": "50fdb4a84921dec8",
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Known classes: ['23r-M/2.1' '23-M/3.1' 'none' '23-M/2.1' '23u-E/7' '23r-E/2.1'\n",
-      " '23r-M/3.1' '23u-M/2.1']\n"
+      "Known classes: ['23-M/2.1', '23-M/3.1', '23r-E/2.1', '23r-M/2.1', '23r-M/3.1', '23u-E/7', '23u-M/2.1', 'none']\n"
      ]
     }
    ],
diff --git a/dataset/grazpedwri_dataset.py b/dataset/grazpedwri_dataset.py
@@ -0,0 +1,129 @@
+import logging
+from pathlib import Path
+from typing import Any
+
+import pandas as pd
+import torch
+from PIL import Image
+from kornia.enhance import Normalize
+from pytorch_lightning import LightningDataModule
+from torch.utils.data import Dataset
+from torchvision.transforms.functional import to_tensor
+from tqdm import tqdm
+
+
+class GrazPedWriDataset(Dataset):
+    """Image dataset held fully in memory with multi-hot targets from the 'ao_classification' column."""
+    # calculated over training split
+    IMG_MEAN = 0.3505533917353781
+    IMG_STD = 0.22763733675869177
+
+    # (height, width) every image is resized to
+    RESCALE_HW = (384, 224)
+
+    CLASS_LABEL = ['23-M/2.1', '23-M/3.1', '23r-E/2.1', '23r-M/2.1', '23r-M/3.1', '23u-E/7', '23u-M/2.1', 'none']
+    CLASS_IDX = {label: idx for idx, label in enumerate(CLASS_LABEL)}
+    N_CLASSES = len(CLASS_LABEL)
+
+    def __init__(self, mode: str, fold: int = 0, number_training_samples: int | str = 'all'):
+        """
+        load the meta data of the requested split and cache all of its images in memory
+        :param mode: 'train' keeps every fold except `fold`, 'val' keeps only `fold`
+        :param fold: index of the held-out cross-validation fold
+        :param number_training_samples: only 'all' is supported so far
+        :raises ValueError: for an unknown mode or a sample without any known class
+        :raises NotImplementedError: if a subset of the training samples is requested
+        """
+        super().__init__()
+        # load data meta and other information
+        self.df_meta = pd.read_csv('data/dataset_cv_splits.csv', index_col='filestem')
+        # init ground truth parser considering the data split
+        if mode == 'train':
+            self.df_meta = self.df_meta[self.df_meta['fold'] != fold]
+        elif mode == 'val':
+            self.df_meta = self.df_meta[self.df_meta['fold'] == fold]
+        else:
+            raise ValueError(f'Unknown mode: {mode}')
+        self.available_file_names = self.df_meta.index.tolist()
+
+        # get subset of training samples
+        if mode == 'train' and number_training_samples != 'all':
+            raise NotImplementedError('number_training_samples is not implemented for GrazPedWriDataset')
+        elif mode != 'train' and number_training_samples != 'all':
+            logging.warning(f'number_training_samples is not used for mode {mode}')
+
+        # load img into memory
+        img_path = Path('data/img_only_front_all_left')
+        self.data = dict()
+        for file_name in tqdm(self.available_file_names, unit='img', desc=f'Loading data for {mode}'):
+            # image: converted to grayscale and resized; PIL expects (width, height), hence the reversal
+            with Image.open(img_path.joinpath(file_name).with_suffix('.png')) as raw:
+                img = to_tensor(raw.convert('L').resize(self.RESCALE_HW[::-1], Image.BILINEAR))
+
+            # classification ground truth: multi-hot vector, labels missing from CLASS_LABEL are ignored
+            class_labels: list[str] = self.df_meta.loc[file_name, 'ao_classification'].split(';')
+            y = torch.zeros(self.N_CLASSES)
+            for c in class_labels:
+                c = c.strip()
+                if c in self.CLASS_IDX:
+                    y[self.CLASS_IDX[c]] = 1
+            if y.sum() == 0:
+                raise ValueError(f'No valid class found for {file_name} with {class_labels}')
+
+            self.data[file_name] = {'file_name': file_name, 'image': img, 'y': y}
+
+    def __len__(self):
+        """number of samples in the selected split"""
+        return len(self.available_file_names)
+
+    def __getitem__(self, index):
+        """
+        get item by index
+        :param index: index of item
+        :return: dict with keys ['file_name', 'image', 'y']
+        """
+        file_name = self.available_file_names[index]
+        return self.data[file_name]
+
+
+class GrazPedWriDataModule(LightningDataModule):
+    """Lightning data module that builds GrazPedWriDataset splits for one cross-validation fold."""
+    def __init__(self, fold: int = 0, batch_size: int = 32, number_training_samples: int | str = 'all'):
+        super().__init__()
+        self.fold, self.n_train = fold, number_training_samples
+        self.dl_kwargs = dict(batch_size=batch_size, num_workers=4, pin_memory=torch.cuda.is_available())
+        self.normalize = Normalize(mean=GrazPedWriDataset.IMG_MEAN, std=GrazPedWriDataset.IMG_STD)
+
+    def setup(self, stage: str = None):
+        if stage in ('fit', None):  # stage=None prepares the datasets of every stage
+            self.train_dataset = GrazPedWriDataset('train', self.fold, self.n_train)
+            self.val_dataset = GrazPedWriDataset('val', self.fold)
+        if stage in ('test', None):
+            self.test_dataset = GrazPedWriDataset('val', self.fold)  # test reuses the validation fold
+
+    def train_dataloader(self):
+        return torch.utils.data.DataLoader(self.train_dataset, shuffle=True, drop_last=True, **self.dl_kwargs)
+
+    def val_dataloader(self):
+        return torch.utils.data.DataLoader(self.val_dataset, **self.dl_kwargs)
+
+    def test_dataloader(self):
+        return torch.utils.data.DataLoader(self.test_dataset, **self.dl_kwargs)
+
+    def on_after_batch_transfer(self, batch: Any, dataloader_idx: int) -> Any:
+        batch['image'] = self.normalize(batch['image'])  # normalize with the dataset mean/std after transfer
+        return batch
+
+
+if __name__ == '__main__':
+    # smoke test: show the first validation sample of fold 0 together with all of its labels
+    import matplotlib.pyplot as plt
+
+    dataset = GrazPedWriDataset('val', fold=0)
+    data = dataset[0]
+    print(data['image'].shape)
+    print(data['y'])
+    plt.figure(data['file_name'])
+    plt.imshow(data['image'].squeeze().numpy(), cmap='gray')
+    plt.title('; '.join(c for c, hit in zip(dataset.CLASS_LABEL, data['y'].tolist()) if hit))  # y is multi-hot
+    plt.show()