Commit 2331b9a

getting some kind of baseline result but they're still garbage
1 parent 3afb9cd commit 2331b9a

File tree: 9 files changed, +151 -22 lines changed


configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py

Lines changed: 7 additions & 0 deletions

@@ -4,12 +4,19 @@
 # '../_base_/schedules/schedule_160k.py'
 # ]

+# _base_ = [
+#     '../_base_/models/segmenter_vit-b16_mask.py',
+#     '../_base_/datasets/aerial.py', '../_base_/default_runtime.py',
+#     '../_base_/schedules/schedule_160k.py'
+# ]
+
 _base_ = [
     '../_base_/models/segmenter_vit-b16_mask.py',
     '../_base_/datasets/aerial.py', '../_base_/default_runtime.py',
     '../_base_/schedules/schedule_160k.py'
 ]

+
 checkpoint = 'https://download.openmmlab.com/mmsegmentation/v0.5/pretrain/segmenter/vit_small_p16_384_20220308-410f6037.pth'  # noqa

 backbone_norm_cfg = dict(type='LN', eps=1e-6, requires_grad=True)
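
Note (not part of the diff): the `_base_` swap above is what points the Segmenter config at the aerial dataset; mmcv's Config merges every file in the `_base_` list into one config dict. A minimal sketch of loading the composed config, assuming the file path from the header and that `../_base_/datasets/aerial.py` sets `dataset_type = 'AerialDataset'`:

from mmcv import Config

# Load the config shown above; mmcv merges the listed base files
# (model, dataset, runtime, schedule) into a single config dict.
cfg = Config.fromfile(
    'configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py')

# Assumed outcome: the test pipeline now comes from the aerial dataset base.
print(cfg.data.test.type)   # e.g. 'AerialDataset' if aerial.py defines it
print(cfg.checkpoint)       # the ViT-S pretrain URL set in this file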

demo/inference_demo_2.ipynb

Lines changed: 29 additions & 6 deletions
Large diffs are not rendered by default.

mmseg/apis/test.py

Lines changed: 2 additions & 0 deletions

@@ -78,6 +78,7 @@ def single_gpu_test(model,
     model.eval()
     results = []
     dataset = data_loader.dataset
+    # print("DATASET LINE 81: ", dataset)
     prog_bar = mmcv.ProgressBar(len(dataset))
     # The pipeline about how the data_loader retrieval samples from dataset:
     # sampler -> batch_sampler -> indices
@@ -107,6 +108,7 @@ def single_gpu_test(model,
                     out_file = osp.join(out_dir, img_meta['ori_filename'])
                 else:
                     out_file = None
+                # print("dataset.PALETTE!!!! ", dataset.PALETTE)

                 model.module.show_result(
                     img_show,

mmseg/core/evaluation/metrics.py

Lines changed: 11 additions & 2 deletions

@@ -4,6 +4,7 @@
 import mmcv
 import numpy as np
 import torch
+import torchvision.transforms.functional as tf


 def f_score(precision, recall, beta=1):
@@ -62,16 +63,24 @@ def intersect_and_union(pred_label,
             mmcv.imread(label, flag='unchanged', backend='pillow'))
     else:
         label = torch.from_numpy(label)
-
+    # print("label map ", label_map)
     if label_map is not None:
         for old_id, new_id in label_map.items():
             label[label == old_id] = new_id
     if reduce_zero_label:
         label[label == 0] = 255
         label = label - 1
         label[label == 254] = 255
-
+    # label = tf.rgb_to_grayscale(label, 1)
+    # print("label shape ", label.shape)
+    # print("pred label: ", torch.max(pred_label))
+    label = label[:,:,0]
+    # print("label shape after ", label.shape)
     mask = (label != ignore_index)
+    # print("pred label: ", pred_label)
+    # print("pred label shape: ", pred_label.shape)
+    # print("mask: ", mask)
+    # print("mask shape: ", mask.shape)
     pred_label = pred_label[mask]
     label = label[mask]

mmseg/datasets/aerial.py

Lines changed: 79 additions & 6 deletions

@@ -18,17 +18,87 @@ class AerialDataset(CustomDataset):
     The ``img_suffix`` is fixed to '.jpg' and ``seg_map_suffix`` is fixed to
     '.png'.
     """
-    CLASSES = ('paved-area', 'dirt', 'grass', 'gravel', 'water', 'rocks', 'pool', 'vegetation',
-               'roof', 'wall', 'window', 'door', 'fence', 'fence-pole', 'person', 'dog', 'car', 'bicycle', 'tree', 'bald-tree', 'ar-marker', 'obstacle', 'conflicting', 'unlabeled')
-
-    PALETTE = [[128, 64, 128], [130, 76, 0], [0, 102, 0], [112, 103, 87], [28, 42, 168], [48, 41, 30], [0, 50, 89], [107, 142, 35], [70, 70, 70], [102, 102, 156], [254, 228, 12], [254, 148, 12], [190, 153, 153], [153, 153, 153], [255, 22, 96], [102, 51, 0], [9, 143, 150], [119, 11, 32], [51, 51, 0], [190, 250, 190], [112, 150, 146], [2, 135, 115], [255, 0, 0], [0, 0, 0]]
+    AERIAL_CLASSES = ('sidewalk', 'earth', 'grass', 'sand', 'water', 'rock', 'swimming pool', 'plant',
+                      'building', 'wall', 'windowpane', 'door', 'fence', 'pole', 'person', 'animal', 'car', 'bicycle', 'tree', 'television receiver', 'microwave', 'coffee table', 'trade name', 'sconce')
+    CLASSES = (
+        'wall', 'building', 'sky', 'floor', 'tree', 'ceiling', 'road', 'bed ',
+        'windowpane', 'grass', 'cabinet', 'sidewalk', 'person', 'earth',
+        'door', 'table', 'mountain', 'plant', 'curtain', 'chair', 'car',
+        'water', 'painting', 'sofa', 'shelf', 'house', 'sea', 'mirror', 'rug',
+        'field', 'armchair', 'seat', 'fence', 'desk', 'rock', 'wardrobe',
+        'lamp', 'bathtub', 'railing', 'cushion', 'base', 'box', 'column',
+        'signboard', 'chest of drawers', 'counter', 'sand', 'sink',
+        'skyscraper', 'fireplace', 'refrigerator', 'grandstand', 'path',
+        'stairs', 'runway', 'case', 'pool table', 'pillow', 'screen door',
+        'stairway', 'river', 'bridge', 'bookcase', 'blind', 'coffee table',
+        'toilet', 'flower', 'book', 'hill', 'bench', 'countertop', 'stove',
+        'palm', 'kitchen island', 'computer', 'swivel chair', 'boat', 'bar',
+        'arcade machine', 'hovel', 'bus', 'towel', 'light', 'truck', 'tower',
+        'chandelier', 'awning', 'streetlight', 'booth', 'television receiver',
+        'airplane', 'dirt track', 'apparel', 'pole', 'land', 'bannister',
+        'escalator', 'ottoman', 'bottle', 'buffet', 'poster', 'stage', 'van',
+        'ship', 'fountain', 'conveyer belt', 'canopy', 'washer', 'plaything',
+        'swimming pool', 'stool', 'barrel', 'basket', 'waterfall', 'tent',
+        'bag', 'minibike', 'cradle', 'oven', 'ball', 'food', 'step', 'tank',
+        'trade name', 'microwave', 'pot', 'animal', 'bicycle', 'lake',
+        'dishwasher', 'screen', 'blanket', 'sculpture', 'hood', 'sconce',
+        'vase', 'traffic light', 'tray', 'ashcan', 'fan', 'pier', 'crt screen',
+        'plate', 'monitor', 'bulletin board', 'shower', 'radiator', 'glass',
+        'clock', 'flag')
+
+    AERIAL_PALETTE = [[128, 64, 128], [130, 76, 0], [0, 102, 0], [112, 103, 87], [28, 42, 168], [48, 41, 30], [0, 50, 89], [107, 142, 35], [70, 70, 70], [102, 102, 156], [254, 228, 12], [254, 148, 12], [190, 153, 153], [153, 153, 153], [255, 22, 96], [102, 51, 0], [9, 143, 150], [119, 11, 32], [51, 51, 0], [190, 250, 190], [112, 150, 146], [2, 135, 115], [255, 0, 0], [0, 0, 0]]
+    PALETTE = [[120, 120, 120], [180, 120, 120], [6, 230, 230], [80, 50, 50],
+               [4, 200, 3], [120, 120, 80], [140, 140, 140], [204, 5, 255],
+               [230, 230, 230], [4, 250, 7], [224, 5, 255], [235, 255, 7],
+               [150, 5, 61], [120, 120, 70], [8, 255, 51], [255, 6, 82],
+               [143, 255, 140], [204, 255, 4], [255, 51, 7], [204, 70, 3],
+               [0, 102, 200], [61, 230, 250], [255, 6, 51], [11, 102, 255],
+               [255, 7, 71], [255, 9, 224], [9, 7, 230], [220, 220, 220],
+               [255, 9, 92], [112, 9, 255], [8, 255, 214], [7, 255, 224],
+               [255, 184, 6], [10, 255, 71], [255, 41, 10], [7, 255, 255],
+               [224, 255, 8], [102, 8, 255], [255, 61, 6], [255, 194, 7],
+               [255, 122, 8], [0, 255, 20], [255, 8, 41], [255, 5, 153],
+               [6, 51, 255], [235, 12, 255], [160, 150, 20], [0, 163, 255],
+               [140, 140, 140], [250, 10, 15], [20, 255, 0], [31, 255, 0],
+               [255, 31, 0], [255, 224, 0], [153, 255, 0], [0, 0, 255],
+               [255, 71, 0], [0, 235, 255], [0, 173, 255], [31, 0, 255],
+               [11, 200, 200], [255, 82, 0], [0, 255, 245], [0, 61, 255],
+               [0, 255, 112], [0, 255, 133], [255, 0, 0], [255, 163, 0],
+               [255, 102, 0], [194, 255, 0], [0, 143, 255], [51, 255, 0],
+               [0, 82, 255], [0, 255, 41], [0, 255, 173], [10, 0, 255],
+               [173, 255, 0], [0, 255, 153], [255, 92, 0], [255, 0, 255],
+               [255, 0, 245], [255, 0, 102], [255, 173, 0], [255, 0, 20],
+               [255, 184, 184], [0, 31, 255], [0, 255, 61], [0, 71, 255],
+               [255, 0, 204], [0, 255, 194], [0, 255, 82], [0, 10, 255],
+               [0, 112, 255], [51, 0, 255], [0, 194, 255], [0, 122, 255],
+               [0, 255, 163], [255, 153, 0], [0, 255, 10], [255, 112, 0],
+               [143, 255, 0], [82, 0, 255], [163, 255, 0], [255, 235, 0],
+               [8, 184, 170], [133, 0, 255], [0, 255, 92], [184, 0, 255],
+               [255, 0, 31], [0, 184, 255], [0, 214, 255], [255, 0, 112],
+               [92, 255, 0], [0, 224, 255], [112, 224, 255], [70, 184, 160],
+               [163, 0, 255], [153, 0, 255], [71, 255, 0], [255, 0, 163],
+               [255, 204, 0], [255, 0, 143], [0, 255, 235], [133, 255, 0],
+               [255, 0, 235], [245, 0, 255], [255, 0, 122], [255, 245, 0],
+               [10, 190, 212], [214, 255, 0], [0, 204, 255], [20, 0, 255],
+               [255, 255, 0], [0, 153, 255], [0, 41, 255], [0, 255, 204],
+               [41, 0, 255], [41, 255, 0], [173, 0, 255], [0, 245, 255],
+               [71, 0, 255], [122, 0, 255], [0, 255, 184], [0, 92, 255],
+               [184, 255, 0], [0, 133, 255], [255, 214, 0], [25, 194, 194],
+               [102, 255, 0], [92, 0, 255]]
+    # PALETTE = None
+    # CLASSES = None

     def __init__(self, **kwargs):
         super(AerialDataset, self).__init__(
             img_suffix='.jpg',
             seg_map_suffix='.png',
             reduce_zero_label=True,
-            **kwargs)
+            **kwargs
+        )
+        self.CLASSES, self.PALETTE = self.get_classes_and_palette(self.AERIAL_CLASSES, self.AERIAL_PALETTE)
+        # print("self.classes len ", len(self.CLASSES))
+        # print("self.palette len ", len(self.PALETTE))
+

     def results2img(self, results, imgfile_prefix, to_label_id, indices=None):
         """Write the segmentation results to images.
@@ -49,6 +119,7 @@ def results2img(self, results, imgfile_prefix, to_label_id, indices=None):
             list[str: str]: result txt files which contains corresponding
                 semantic segmentation images.
         """
+        print("IN RESULTS 2 IMG")
         if indices is None:
             indices = list(range(len(self)))

@@ -95,7 +166,7 @@ def format_results(self,
                 the image paths, tmp_dir is the temporal directory created
                 for saving json/png files when img_prefix is not specified.
         """
-
+        print("IN FORMAT RESULTS")
         if indices is None:
             indices = list(range(len(self)))

@@ -105,3 +176,5 @@ def format_results(self,
         result_files = self.results2img(results, imgfile_prefix, to_label_id,
                                         indices)
         return result_files
+
+
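
Note (not part of the diff): renaming the drone classes to their nearest ADE20K names and then calling `get_classes_and_palette(AERIAL_CLASSES, AERIAL_PALETTE)` makes `CustomDataset` build a `label_map` from the full ADE20K class order down to the 24 aerial names, so ground-truth ids can be remapped before evaluation. A toy sketch of that remap with made-up, truncated lists:

# Stand-ins: a few ADE20K names in checkpoint order, and the aerial subset kept.
ade20k_order = ('wall', 'building', 'sky', 'tree', 'road', 'grass')
aerial_names = ('grass', 'building', 'wall', 'tree')

label_map = {}
for i, name in enumerate(ade20k_order):
    # same rule as CustomDataset.get_classes_and_palette: unmatched classes -> -1
    label_map[i] = aerial_names.index(name) if name in aerial_names else -1

print(label_map)   # {0: 2, 1: 1, 2: -1, 3: 3, 4: -1, 5: 0}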

mmseg/datasets/custom.py

Lines changed: 11 additions & 3 deletions

@@ -282,9 +282,11 @@ def pre_eval(self, preds, indices):
             preds = [preds]

         pre_eval_results = []
-
+        # print("preds shape: ", preds[0].shape)
         for pred, index in zip(preds, indices):
             seg_map = self.get_gt_seg_map_by_idx(index)
+            # print("seg map shape: ", seg_map.shape)
+            # print("pred shape: ", pred.shape)
             pre_eval_results.append(
                 intersect_and_union(pred, seg_map, len(self.CLASSES),
                                     self.ignore_index, self.label_map,
@@ -305,6 +307,8 @@ def get_classes_and_palette(self, classes=None, palette=None):
                 The palette of segmentation map. If None is given, random
                 palette will be generated. Default: None
         """
+        # print("print classes!!: ", classes)
+        # print("print palette!!: ", palette)
         if classes is None:
             self.custom_classes = False
             return self.CLASSES, self.PALETTE
@@ -326,14 +330,18 @@ def get_classes_and_palette(self, classes=None, palette=None):
             # are the new label ids.
             # used for changing pixel labels in load_annotations.
             self.label_map = {}
+            # print("class_names ", class_names)
             for i, c in enumerate(self.CLASSES):
                 if c not in class_names:
                     self.label_map[i] = -1
                 else:
                     self.label_map[i] = class_names.index(c)
-
+            # print("self.label_map!!!!!: ", self.label_map)
+        print("print classes!! before: ", class_names)
+        print("print palette!! before: ", palette)
         palette = self.get_palette_for_custom_classes(class_names, palette)
-
+        print("print classes!! after: ", class_names)
+        print("print palette!! after: ", palette)
         return class_names, palette

     def get_palette_for_custom_classes(self, class_names, palette=None):
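
Note (not part of the diff): the shape prints in `pre_eval` guard the hand-off into `intersect_and_union`, which only works once `pred` and `seg_map` are the same H x W index maps. A tiny worked example of the per-class areas that call reduces each pair to (toy tensors; nothing hits ignore_index here):

import torch

pred = torch.tensor([[0, 1], [1, 2]])
label = torch.tensor([[0, 1], [2, 2]])
num_classes, ignore_index = 3, 255

mask = label != ignore_index                  # nothing ignored in this toy case
correct = pred[mask][pred[mask] == label[mask]]
area_intersect = torch.histc(correct.float(), bins=num_classes, min=0, max=num_classes - 1)
area_pred = torch.histc(pred[mask].float(), bins=num_classes, min=0, max=num_classes - 1)
area_label = torch.histc(label[mask].float(), bins=num_classes, min=0, max=num_classes - 1)
area_union = area_pred + area_label - area_intersect
print(area_intersect, area_union)             # tensor([1., 1., 1.]) tensor([1., 2., 2.])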

mmseg/datasets/pipelines/loading.py

Lines changed: 1 addition & 0 deletions

@@ -120,6 +120,7 @@ def __call__(self, results):
         Returns:
             dict: The dict contains loaded semantic segmentation annotations.
         """
+        print("AYOOOOOOOOOOOO")

         if self.file_client is None:
             self.file_client = mmcv.FileClient(**self.file_client_args)

mmseg/models/segmentors/base.py

Lines changed: 3 additions & 0 deletions

@@ -243,6 +243,7 @@ def show_result(self,
         img = mmcv.imread(img)
         img = img.copy()
         seg = result[0]
+        # print("self classes ", self.CLASSES)
         if palette is None:
             if self.PALETTE is None:
                 # Get random state before set seed,
@@ -259,6 +260,8 @@ def show_result(self,
             else:
                 palette = self.PALETTE
         palette = np.array(palette)
+        print("PALETTE SHAPE 0 ", palette.shape[0])
+        print("LEN SELF CLASSES ", len(self.CLASSES))
         assert palette.shape[0] == len(self.CLASSES)
         assert palette.shape[1] == 3
         assert len(palette.shape) == 2
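
Note (not part of the diff, sizes assumed from this commit's setup): the two prints sit just above the assertion most likely to trip once tools/test.py forces `model.CLASSES = dataset.CLASSES` (24 aerial names) while `model.PALETTE` can still come from the ADE20K checkpoint meta (150 colours). A self-contained reproduction of that mismatch with stand-in values:

import numpy as np

palette = np.array([[120, 120, 120]] * 150)   # stand-in for 150 ADE20K colours from checkpoint meta
classes = ('sidewalk', 'earth', 'grass')      # truncated stand-in for the 24 aerial names

try:
    assert palette.shape[0] == len(classes)
except AssertionError:
    print('palette/classes mismatch:', palette.shape[0], 'vs', len(classes))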

tools/test.py

Lines changed: 8 additions & 5 deletions

@@ -191,6 +191,7 @@ def main():
     # build the dataloader
     # TODO: support multiple images per gpu (only minor changes are needed)
     dataset = build_dataset(cfg.data.test)
+    print("Dataset!: ", dataset)
     data_loader = build_dataloader(
         dataset,
         samples_per_gpu=1,
@@ -205,11 +206,11 @@ def main():
     if fp16_cfg is not None:
         wrap_fp16_model(model)
     checkpoint = load_checkpoint(model, args.checkpoint, map_location='cpu')
-    if 'CLASSES' in checkpoint.get('meta', {}):
-        model.CLASSES = checkpoint['meta']['CLASSES']
-    else:
-        print('"CLASSES" not found in meta, use dataset.CLASSES instead')
-        model.CLASSES = dataset.CLASSES
+    # if 'CLASSES' in checkpoint.get('meta', {}):
+    #     model.CLASSES = checkpoint['meta']['CLASSES']
+    # else:
+    print('"CLASSES" not found in meta, use dataset.CLASSES instead')
+    model.CLASSES = dataset.CLASSES
     if 'PALETTE' in checkpoint.get('meta', {}):
         model.PALETTE = checkpoint['meta']['PALETTE']
     else:
@@ -254,6 +255,8 @@ def main():
             'Please use MMCV >= 1.4.4 for CPU training!'
         model = revert_sync_batchnorm(model)
         model = MMDataParallel(model, device_ids=cfg.gpu_ids)
+        # print("MODEL ", model)
+        # print("DATA LOADER ", data_loader)
         results = single_gpu_test(
             model,
             data_loader,
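
Note (not part of the diff): with the checkpoint-meta branch commented out, the surviving lines always take the dataset's class names, and the leftover print now fires unconditionally. A self-contained sketch of the resolution rule this block implements, with stand-in arguments (the PALETTE else branch is outside the hunk shown above, so the dataset fallback here is assumed):

def resolve_classes_and_palette(checkpoint_meta, dataset_classes, dataset_palette):
    # CLASSES: checkpoint meta is ignored after this commit; always use the dataset's.
    classes = dataset_classes
    # PALETTE: still prefer the checkpoint meta, fall back to the dataset (assumed).
    palette = checkpoint_meta.get('PALETTE', dataset_palette)
    return classes, palette

# Stand-in values: an ADE20K-style meta paired with a tiny aerial class tuple.
meta = {'PALETTE': [[120, 120, 120]] * 150}
classes, palette = resolve_classes_and_palette(meta, ('sidewalk', 'earth'), [[128, 64, 128]] * 2)
print(len(classes), len(palette))   # 2 150 -> the mismatch show_result later asserts on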
