arnabGudu
diff --git a/‎.gitignore
+4-3 b/‎.gitignore
+4-3
diff --git a/‎LICENSE
+201-201 b/‎LICENSE
+201-201
diff --git a/‎README.md
+123-123 b/‎README.md
+123-123
diff --git a/‎TRAIN-ON-CUSTOM-DATASET.md
+75-75 b/‎TRAIN-ON-CUSTOM-DATASET.md
+75-75
diff --git a/‎datasets/coco.py
+179-179 b/‎datasets/coco.py
+179-179
@@ -1,3 +1,4 @@
-*.pyc
-__pycache__
-.idea/
+*.pyc
+__pycache__
+.idea/
+checkpoints
@@ -1,179 +1,179 @@
-import copy
-import json
-import math
-import os
-import pickle
-
-import cv2
-import numpy as np
-import pycocotools
-
-from torch.utils.data.dataset import Dataset
-
-BODY_PARTS_KPT_IDS = [[1, 8], [8, 9], [9, 10], [1, 11], [11, 12], [12, 13], [1, 2], [2, 3], [3, 4], [2, 16],
-                      [1, 5], [5, 6], [6, 7], [5, 17], [1, 0], [0, 14], [0, 15], [14, 16], [15, 17]]
-
-
-def get_mask(segmentations, mask):
-    for segmentation in segmentations:
-        rle = pycocotools.mask.frPyObjects(segmentation, mask.shape[0], mask.shape[1])
-        mask[pycocotools.mask.decode(rle) > 0.5] = 0
-    return mask
-
-
-class CocoTrainDataset(Dataset):
-    def __init__(self, labels, images_folder, stride, sigma, paf_thickness, transform=None):
-        super().__init__()
-        self._images_folder = images_folder
-        self._stride = stride
-        self._sigma = sigma
-        self._paf_thickness = paf_thickness
-        self._transform = transform
-        with open(labels, 'rb') as f:
-            self._labels = pickle.load(f)
-
-    def __getitem__(self, idx):
-        label = copy.deepcopy(self._labels[idx])  # label modified in transform
-        image = cv2.imread(os.path.join(self._images_folder, label['img_paths']), cv2.IMREAD_COLOR)
-        mask = np.ones(shape=(label['img_height'], label['img_width']), dtype=np.float32)
-        mask = get_mask(label['segmentations'], mask)
-        sample = {
-            'label': label,
-            'image': image,
-            'mask': mask
-        }
-        if self._transform:
-            sample = self._transform(sample)
-
-        mask = cv2.resize(sample['mask'], dsize=None, fx=1/self._stride, fy=1/self._stride, interpolation=cv2.INTER_AREA)
-        keypoint_maps = self._generate_keypoint_maps(sample)
-        sample['keypoint_maps'] = keypoint_maps
-        keypoint_mask = np.zeros(shape=keypoint_maps.shape, dtype=np.float32)
-        for idx in range(keypoint_mask.shape[0]):
-            keypoint_mask[idx] = mask
-        sample['keypoint_mask'] = keypoint_mask
-
-        paf_maps = self._generate_paf_maps(sample)
-        sample['paf_maps'] = paf_maps
-        paf_mask = np.zeros(shape=paf_maps.shape, dtype=np.float32)
-        for idx in range(paf_mask.shape[0]):
-            paf_mask[idx] = mask
-        sample['paf_mask'] = paf_mask
-
-        image = sample['image'].astype(np.float32)
-        image = (image - 128) / 256
-        sample['image'] = image.transpose((2, 0, 1))
-        del sample['label']
-        return sample
-
-    def __len__(self):
-        return len(self._labels)
-
-    def _generate_keypoint_maps(self, sample):
-        n_keypoints = 18
-        n_rows, n_cols, _ = sample['image'].shape
-        keypoint_maps = np.zeros(shape=(n_keypoints + 1,
-                                        n_rows // self._stride, n_cols // self._stride), dtype=np.float32)  # +1 for bg
-
-        label = sample['label']
-        for keypoint_idx in range(n_keypoints):
-            keypoint = label['keypoints'][keypoint_idx]
-            if keypoint[2] <= 1:
-                self._add_gaussian(keypoint_maps[keypoint_idx], keypoint[0], keypoint[1], self._stride, self._sigma)
-            for another_annotation in label['processed_other_annotations']:
-                keypoint = another_annotation['keypoints'][keypoint_idx]
-                if keypoint[2] <= 1:
-                    self._add_gaussian(keypoint_maps[keypoint_idx], keypoint[0], keypoint[1], self._stride, self._sigma)
-        keypoint_maps[-1] = 1 - keypoint_maps.max(axis=0)
-        return keypoint_maps
-
-    def _add_gaussian(self, keypoint_map, x, y, stride, sigma):
-        n_sigma = 4
-        tl = [int(x - n_sigma * sigma), int(y - n_sigma * sigma)]
-        tl[0] = max(tl[0], 0)
-        tl[1] = max(tl[1], 0)
-
-        br = [int(x + n_sigma * sigma), int(y + n_sigma * sigma)]
-        map_h, map_w = keypoint_map.shape
-        br[0] = min(br[0], map_w * stride)
-        br[1] = min(br[1], map_h * stride)
-
-        shift = stride / 2 - 0.5
-        for map_y in range(tl[1] // stride, br[1] // stride):
-            for map_x in range(tl[0] // stride, br[0] // stride):
-                d2 = (map_x * stride + shift - x) * (map_x * stride + shift - x) + \
-                    (map_y * stride + shift - y) * (map_y * stride + shift - y)
-                exponent = d2 / 2 / sigma / sigma
-                if exponent > 4.6052:  # threshold, ln(100), ~0.01
-                    continue
-                keypoint_map[map_y, map_x] += math.exp(-exponent)
-                if keypoint_map[map_y, map_x] > 1:
-                    keypoint_map[map_y, map_x] = 1
-
-    def _generate_paf_maps(self, sample):
-        n_pafs = len(BODY_PARTS_KPT_IDS)
-        n_rows, n_cols, _ = sample['image'].shape
-        paf_maps = np.zeros(shape=(n_pafs * 2, n_rows // self._stride, n_cols // self._stride), dtype=np.float32)
-
-        label = sample['label']
-        for paf_idx in range(n_pafs):
-            keypoint_a = label['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][0]]
-            keypoint_b = label['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][1]]
-            if keypoint_a[2] <= 1 and keypoint_b[2] <= 1:
-                self._set_paf(paf_maps[paf_idx * 2:paf_idx * 2 + 2],
-                              keypoint_a[0], keypoint_a[1], keypoint_b[0], keypoint_b[1],
-                              self._stride, self._paf_thickness)
-            for another_annotation in label['processed_other_annotations']:
-                keypoint_a = another_annotation['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][0]]
-                keypoint_b = another_annotation['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][1]]
-                if keypoint_a[2] <= 1 and keypoint_b[2] <= 1:
-                    self._set_paf(paf_maps[paf_idx * 2:paf_idx * 2 + 2],
-                                  keypoint_a[0], keypoint_a[1], keypoint_b[0], keypoint_b[1],
-                                  self._stride, self._paf_thickness)
-        return paf_maps
-
-    def _set_paf(self, paf_map, x_a, y_a, x_b, y_b, stride, thickness):
-        x_a /= stride
-        y_a /= stride
-        x_b /= stride
-        y_b /= stride
-        x_ba = x_b - x_a
-        y_ba = y_b - y_a
-        _, h_map, w_map = paf_map.shape
-        x_min = int(max(min(x_a, x_b) - thickness, 0))
-        x_max = int(min(max(x_a, x_b) + thickness, w_map))
-        y_min = int(max(min(y_a, y_b) - thickness, 0))
-        y_max = int(min(max(y_a, y_b) + thickness, h_map))
-        norm_ba = (x_ba * x_ba + y_ba * y_ba) ** 0.5
-        if norm_ba < 1e-7:  # Same points, no paf
-            return
-        x_ba /= norm_ba
-        y_ba /= norm_ba
-
-        for y in range(y_min, y_max):
-            for x in range(x_min, x_max):
-                x_ca = x - x_a
-                y_ca = y - y_a
-                d = math.fabs(x_ca * y_ba - y_ca * x_ba)
-                if d <= thickness:
-                    paf_map[0, y, x] = x_ba
-                    paf_map[1, y, x] = y_ba
-
-
-class CocoValDataset(Dataset):
-    def __init__(self, labels, images_folder):
-        super().__init__()
-        with open(labels, 'r') as f:
-            self._labels = json.load(f)
-        self._images_folder = images_folder
-
-    def __getitem__(self, idx):
-        file_name = self._labels['images'][idx]['file_name']
-        img = cv2.imread(os.path.join(self._images_folder, file_name), cv2.IMREAD_COLOR)
-        return {
-            'img': img,
-            'file_name': file_name
-        }
-
-    def __len__(self):
-        return len(self._labels['images'])
+import copy
+import json
+import math
+import os
+import pickle
+
+import cv2
+import numpy as np
+import pycocotools
+
+from torch.utils.data.dataset import Dataset
+
+BODY_PARTS_KPT_IDS = [[1, 8], [8, 9], [9, 10], [1, 11], [11, 12], [12, 13], [1, 2], [2, 3], [3, 4], [2, 16],
+                      [1, 5], [5, 6], [6, 7], [5, 17], [1, 0], [0, 14], [0, 15], [14, 16], [15, 17]]
+
+
+def get_mask(segmentations, mask):
+    for segmentation in segmentations:
+        rle = pycocotools.mask.frPyObjects(segmentation, mask.shape[0], mask.shape[1])
+        mask[pycocotools.mask.decode(rle) > 0.5] = 0
+    return mask
+
+
+class CocoTrainDataset(Dataset):
+    def __init__(self, labels, images_folder, stride, sigma, paf_thickness, transform=None):
+        super().__init__()
+        self._images_folder = images_folder
+        self._stride = stride
+        self._sigma = sigma
+        self._paf_thickness = paf_thickness
+        self._transform = transform
+        with open(labels, 'rb') as f:
+            self._labels = pickle.load(f)
+
+    def __getitem__(self, idx):
+        label = copy.deepcopy(self._labels[idx])  # label modified in transform
+        image = cv2.imread(os.path.join(self._images_folder, label['img_paths']), cv2.IMREAD_COLOR)
+        mask = np.ones(shape=(label['img_height'], label['img_width']), dtype=np.float32)
+        mask = get_mask(label['segmentations'], mask)
+        sample = {
+            'label': label,
+            'image': image,
+            'mask': mask
+        }
+        if self._transform:
+            sample = self._transform(sample)
+
+        mask = cv2.resize(sample['mask'], dsize=None, fx=1/self._stride, fy=1/self._stride, interpolation=cv2.INTER_AREA)
+        keypoint_maps = self._generate_keypoint_maps(sample)
+        sample['keypoint_maps'] = keypoint_maps
+        keypoint_mask = np.zeros(shape=keypoint_maps.shape, dtype=np.float32)
+        for idx in range(keypoint_mask.shape[0]):
+            keypoint_mask[idx] = mask
+        sample['keypoint_mask'] = keypoint_mask
+
+        paf_maps = self._generate_paf_maps(sample)
+        sample['paf_maps'] = paf_maps
+        paf_mask = np.zeros(shape=paf_maps.shape, dtype=np.float32)
+        for idx in range(paf_mask.shape[0]):
+            paf_mask[idx] = mask
+        sample['paf_mask'] = paf_mask
+
+        image = sample['image'].astype(np.float32)
+        image = (image - 128) / 256
+        sample['image'] = image.transpose((2, 0, 1))
+        del sample['label']
+        return sample
+
+    def __len__(self):
+        return len(self._labels)
+
+    def _generate_keypoint_maps(self, sample):
+        n_keypoints = 18
+        n_rows, n_cols, _ = sample['image'].shape
+        keypoint_maps = np.zeros(shape=(n_keypoints + 1,
+                                        n_rows // self._stride, n_cols // self._stride), dtype=np.float32)  # +1 for bg
+
+        label = sample['label']
+        for keypoint_idx in range(n_keypoints):
+            keypoint = label['keypoints'][keypoint_idx]
+            if keypoint[2] <= 1:
+                self._add_gaussian(keypoint_maps[keypoint_idx], keypoint[0], keypoint[1], self._stride, self._sigma)
+            for another_annotation in label['processed_other_annotations']:
+                keypoint = another_annotation['keypoints'][keypoint_idx]
+                if keypoint[2] <= 1:
+                    self._add_gaussian(keypoint_maps[keypoint_idx], keypoint[0], keypoint[1], self._stride, self._sigma)
+        keypoint_maps[-1] = 1 - keypoint_maps.max(axis=0)
+        return keypoint_maps
+
+    def _add_gaussian(self, keypoint_map, x, y, stride, sigma):
+        n_sigma = 4
+        tl = [int(x - n_sigma * sigma), int(y - n_sigma * sigma)]
+        tl[0] = max(tl[0], 0)
+        tl[1] = max(tl[1], 0)
+
+        br = [int(x + n_sigma * sigma), int(y + n_sigma * sigma)]
+        map_h, map_w = keypoint_map.shape
+        br[0] = min(br[0], map_w * stride)
+        br[1] = min(br[1], map_h * stride)
+
+        shift = stride / 2 - 0.5
+        for map_y in range(tl[1] // stride, br[1] // stride):
+            for map_x in range(tl[0] // stride, br[0] // stride):
+                d2 = (map_x * stride + shift - x) * (map_x * stride + shift - x) + \
+                    (map_y * stride + shift - y) * (map_y * stride + shift - y)
+                exponent = d2 / 2 / sigma / sigma
+                if exponent > 4.6052:  # threshold, ln(100), ~0.01
+                    continue
+                keypoint_map[map_y, map_x] += math.exp(-exponent)
+                if keypoint_map[map_y, map_x] > 1:
+                    keypoint_map[map_y, map_x] = 1
+
+    def _generate_paf_maps(self, sample):
+        n_pafs = len(BODY_PARTS_KPT_IDS)
+        n_rows, n_cols, _ = sample['image'].shape
+        paf_maps = np.zeros(shape=(n_pafs * 2, n_rows // self._stride, n_cols // self._stride), dtype=np.float32)
+
+        label = sample['label']
+        for paf_idx in range(n_pafs):
+            keypoint_a = label['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][0]]
+            keypoint_b = label['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][1]]
+            if keypoint_a[2] <= 1 and keypoint_b[2] <= 1:
+                self._set_paf(paf_maps[paf_idx * 2:paf_idx * 2 + 2],
+                              keypoint_a[0], keypoint_a[1], keypoint_b[0], keypoint_b[1],
+                              self._stride, self._paf_thickness)
+            for another_annotation in label['processed_other_annotations']:
+                keypoint_a = another_annotation['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][0]]
+                keypoint_b = another_annotation['keypoints'][BODY_PARTS_KPT_IDS[paf_idx][1]]
+                if keypoint_a[2] <= 1 and keypoint_b[2] <= 1:
+                    self._set_paf(paf_maps[paf_idx * 2:paf_idx * 2 + 2],
+                                  keypoint_a[0], keypoint_a[1], keypoint_b[0], keypoint_b[1],
+                                  self._stride, self._paf_thickness)
+        return paf_maps
+
+    def _set_paf(self, paf_map, x_a, y_a, x_b, y_b, stride, thickness):
+        x_a /= stride
+        y_a /= stride
+        x_b /= stride
+        y_b /= stride
+        x_ba = x_b - x_a
+        y_ba = y_b - y_a
+        _, h_map, w_map = paf_map.shape
+        x_min = int(max(min(x_a, x_b) - thickness, 0))
+        x_max = int(min(max(x_a, x_b) + thickness, w_map))
+        y_min = int(max(min(y_a, y_b) - thickness, 0))
+        y_max = int(min(max(y_a, y_b) + thickness, h_map))
+        norm_ba = (x_ba * x_ba + y_ba * y_ba) ** 0.5
+        if norm_ba < 1e-7:  # Same points, no paf
+            return
+        x_ba /= norm_ba
+        y_ba /= norm_ba
+
+        for y in range(y_min, y_max):
+            for x in range(x_min, x_max):
+                x_ca = x - x_a
+                y_ca = y - y_a
+                d = math.fabs(x_ca * y_ba - y_ca * x_ba)
+                if d <= thickness:
+                    paf_map[0, y, x] = x_ba
+                    paf_map[1, y, x] = y_ba
+
+
+class CocoValDataset(Dataset):
+    def __init__(self, labels, images_folder):
+        super().__init__()
+        with open(labels, 'r') as f:
+            self._labels = json.load(f)
+        self._images_folder = images_folder
+
+    def __getitem__(self, idx):
+        file_name = self._labels['images'][idx]['file_name']
+        img = cv2.imread(os.path.join(self._images_folder, file_name), cv2.IMREAD_COLOR)
+        return {
+            'img': img,
+            'file_name': file_name
+        }
+
+    def __len__(self):
+        return len(self._labels['images'])