Commit 22b3ebb

FCN

YunYang1994 authored and committed
1 parent d15e243 commit 22b3ebb

File tree

6 files changed: +163 -144 lines changed

5-Image_Segmentation/FCN/README.md

Lines changed: 6 additions & 1 deletion
@@ -10,12 +10,14 @@
 ## Train PASCAL VOC2012
 --------------------
 Download VOC PASCAL trainval and test data.
+
 ```bashrc
 $ wget http://host.robots.ox.ac.uk/pascal/VOC/voc2007/VOCtrainval_06-Nov-2007.tar
 $ wget http://host.robots.ox.ac.uk/pascal/VOC/voc2012/VOCtrainval_11-May-2012.tar
 $ wget http://host.robots.ox.ac.uk/pascal/VOC/voc2007/VOCtest_06-Nov-2007.tar
 ```
 Extract all of these tars into one directory and rename them, which should have the following basic structure.
+
 ```bashrc
 VOC # path: /home/yang/dataset/VOC
 ├── test
@@ -26,7 +28,8 @@ VOC # path: /home/yang/dataset/VOC
 └──VOC2007 (from VOCtrainval_06-Nov-2007.tar)
 └──VOC2012 (from VOCtrainval_11-May-2012.tar)
 ```
-Finally you need to make some transformation and train it.
+Finally you need to make some transformation and train it. Here is my trained weight
+
 ```bashrc
 $ python parser_voc.py --voc_path /home/yang/dataset/VOC
 $ python train.py
@@ -37,6 +40,8 @@ Epoch 2/30
 ...
 Epoch 30/30
 6000/6000 [==============================] - 3552s 592ms/step - loss: 0.0811 - accuracy: 0.9797
+
+$ python test.py
 ```

 |![image](https://user-images.githubusercontent.com/30433053/66732790-d4d56680-ee8f-11e9-9120-07b0e8aa53d4.jpg)|![image](https://user-images.githubusercontent.com/30433053/66732791-d69f2a00-ee8f-11e9-9c5d-16cc84bc7e9e.jpg)|![image](https://user-images.githubusercontent.com/30433053/66732795-da32b100-ee8f-11e9-9d85-f0ddba7a3ab1.jpg)|
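The extract-and-rename step in the README is done by hand. As a convenience only, here is a small Python sketch that unpacks the three archives; the tar file names come from the wget commands above, the target directory is the example path used throughout this README and is an assumption, and arranging the result into the train/test layout shown above remains a manual step:

```python
import tarfile

# Assumption: the three tars sit in the current directory and are unpacked
# under /home/yang/dataset (each archive contains a VOCdevkit folder).
archives = [
    "VOCtrainval_06-Nov-2007.tar",
    "VOCtrainval_11-May-2012.tar",
    "VOCtest_06-Nov-2007.tar",
]
for name in archives:
    with tarfile.open(name) as tar:
        tar.extractall(path="/home/yang/dataset")
```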

5-Image_Segmentation/FCN/config.py

Lines changed: 0 additions & 28 deletions
This file was deleted; its constants (classes, colormap, rgb_mean, rgb_std) now live in utils.py.

5-Image_Segmentation/FCN/parser_voc.py

Lines changed: 1 addition & 0 deletions
@@ -20,6 +20,7 @@
 if not os.path.exists("./data"): os.mkdir("./data")
 if not os.path.exists("./data/train_labels"): os.mkdir("./data/train_labels")
 if not os.path.exists("./data/test_labels"): os.mkdir("./data/test_labels")
+if not os.path.exists("./data/prediction"): os.mkdir("./data/prediction")

 parser = argparse.ArgumentParser()
 parser.add_argument("--voc_path", type=str, default="/home/yang/dataset/VOC")
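The added line keeps the existing `os.path.exists` / `os.mkdir` pattern for the new `./data/prediction` output folder. A shorter equivalent, a sketch rather than part of this commit, is `os.makedirs` with `exist_ok=True`, which also creates missing parent directories:

```python
import os

# Create every output folder used by parser_voc.py and test.py in one pass;
# exist_ok=True makes the call a no-op when a directory already exists.
for folder in ("./data", "./data/train_labels", "./data/test_labels", "./data/prediction"):
    os.makedirs(folder, exist_ok=True)
```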

5-Image_Segmentation/FCN/test.py

Lines changed: 40 additions & 0 deletions
@@ -0,0 +1,40 @@
+#! /usr/bin/env python
+# coding=utf-8
+#================================================================
+#   Copyright (C) 2019 * Ltd. All rights reserved.
+#
+#   Editor      : VIM
+#   File name   : test.py
+#   Author      : YunYang1994
+#   Created date: 2019-10-23 23:14:38
+#   Description :
+#
+#================================================================
+
+import numpy as np
+import tensorflow as tf
+
+from fcn8s import FCN8s
+from utils import visual_result, DataGenerator
+
+model = FCN8s(n_class=21)
+TestSet = DataGenerator("./data/test_image.txt", "./data/test_labels", 1)
+
+## load weights and test your model after training
+## if you want to test model, first you need to initialize your model
+## with "model(data)", and then load model weights
+data = np.ones(shape=[1,224,224,3], dtype=np.float)
+model(data)
+model.load_weights("FCN8s.h5")
+
+for idx, (x, y) in enumerate(TestSet):
+    result = model(x)
+    pred_label = tf.argmax(result, axis=-1)
+    result = visual_result(x[0], pred_label[0].numpy())
+    save_file = "./data/prediction/%d.jpg" %idx
+    print("=> saving prediction result into ", save_file)
+    result.save(save_file)
+    if idx == 209:
+        result.show()
+        break
+
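The dummy forward pass in test.py is there because `FCN8s` is a subclassed `tf.keras.Model`: its variables are only created the first time the model is called, and `load_weights` needs those variables to exist before it can restore values into them. A minimal sketch of that pattern, assuming only that the model takes `[batch, 224, 224, 3]` inputs:

```python
import numpy as np
from fcn8s import FCN8s  # project module shown above

model = FCN8s(n_class=21)
# Build the model's variables by running one dummy batch through it,
# then the checkpoint produced by train.py can be restored onto them.
model(np.zeros([1, 224, 224, 3], dtype=np.float32))
model.load_weights("FCN8s.h5")
```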

5-Image_Segmentation/FCN/train.py

Lines changed: 2 additions & 115 deletions
@@ -11,131 +11,18 @@
 #
 #================================================================

-import os
-import cv2
-import random
 import tensorflow as tf
-import numpy as np
 from fcn8s import FCN8s
-from PIL import Image
-from config import colormap, classes, rgb_mean, rgb_std
-
-
-def create_image_label_path_generator(images_filepath, labels_filepath):
-    image_paths = open(images_filepath).readlines()
-    all_label_txts = os.listdir(labels_filepath)
-    image_label_paths = []
-    for label_txt in all_label_txts:
-        label_name = label_txt[:-4]
-        label_path = labels_filepath + "/" + label_txt
-        for image_path in image_paths:
-            image_path = image_path.rstrip()
-            image_name = image_path.split("/")[-1][:-4]
-            if label_name == image_name:
-                image_label_paths.append((image_path, label_path))
-    while True:
-        random.shuffle(image_label_paths)
-        for i in range(len(image_label_paths)):
-            yield image_label_paths[i]
-
-
-def process_image_label(image_path, label_path):
-    # image = misc.imread(image_path)
-    image = cv2.imread(image_path)
-    image = cv2.resize(image, (224, 224), interpolation=cv2.INTER_NEAREST)
-    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
-    # data augmentation here
-    # pass
-    # image transformation here
-    image = (image / 255. - rgb_mean) / rgb_std
-
-    label = open(label_path).readlines()
-    label = [np.array(line.rstrip().split(" ")) for line in label]
-    label = np.array(label, dtype=np.int)
-    label = cv2.resize(label, (224, 224), interpolation=cv2.INTER_NEAREST)
-    label = label.astype(np.int)
-
-    return image, label
-
-
-def DataGenerator(train_image_txt, train_labels_dir, batch_size):
-    """
-    generate image and mask at the same time
-    """
-    image_label_path_generator = create_image_label_path_generator(
-        train_image_txt, train_labels_dir
-    )
-    while True:
-        images = np.zeros(shape=[batch_size, 224, 224, 3])
-        labels = np.zeros(shape=[batch_size, 224, 224], dtype=np.float)
-        for i in range(batch_size):
-            image_path, label_path = next(image_label_path_generator)
-            image, label = process_image_label(image_path, label_path)
-            images[i], labels[i] = image, label
-        yield images, labels
-
-
-def visual_result(image, label, alpha=0.7):
-    """
-    image shape -> [H, W, C]
-    label shape -> [H, W]
-    """
-    image = (image * rgb_std + rgb_mean) * 255
-    image, label = image.astype(np.int), label.astype(np.int)
-    H, W, C = image.shape
-    masks_color = np.zeros(shape=[H, W, C])
-    inv_masks_color = np.zeros(shape=[H, W, C])
-    cls = []
-    for i in range(H):
-        for j in range(W):
-            cls_idx = label[i, j]
-            masks_color[i, j] = np.array(colormap[cls_idx])
-            cls.append(cls_idx)
-            if classes[cls_idx] == "background":
-                inv_masks_color[i, j] = alpha * image[i, j]
-
-    show_image = np.zeros(shape=[224, 672, 3])
-    cls = set(cls)
-    for x in cls:
-        print("=> ", classes[x])
-    show_image[:, :224, :] = image
-    show_image[:, 224:448, :] = masks_color
-    show_image[:, 448:, :] = (1-alpha)*image + alpha*masks_color + inv_masks_color
-    show_image = Image.fromarray(np.uint8(show_image))
-    return show_image
+from utils import DataGenerator

 TrainSet = DataGenerator("./data/train_image.txt", "./data/train_labels", 2)
-TestSet = DataGenerator("./data/test_image.txt", "./data/test_labels", 1)
-
 model = FCN8s(n_class=21)
-callback = tf.keras.callbacks.ModelCheckpoint("model.h5", verbose=1, save_weights_only=True)
+callback = tf.keras.callbacks.ModelCheckpoint("FCN8s.h5", verbose=1, save_weights_only=True)
 model.compile(optimizer=tf.keras.optimizers.Adam(lr=1e-4),
               callback=callback,
               loss='sparse_categorical_crossentropy',
               metrics=['accuracy'])

 ## train your FCN8s model
 model.fit_generator(TrainSet, steps_per_epoch=6000, epochs=30)
-model.save_weights("model.h5")
-
-## load weights and test your model after training
-## if you want to test model, first you need to initialize your model
-## with "model(data)", and then load model weights
-
-# data = np.ones(shape=[1,224,224,3], dtype=np.float)
-# model(data)
-# model.load_weights("model.h5")
-
-for idx, (x, y) in enumerate(TestSet):
-    result = model(x)
-    pred_label = tf.argmax(result, axis=-1)
-    result = visual_result(x[0], pred_label[0].numpy())
-    save_file = "./data/prediction/%d.jpg" %idx
-    print("=> saving prediction result into ", save_file)
-    result.save(save_file)
-    if idx == 209:
-        result.show()
-        break
-
-

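One caveat about the training script: `compile` has no notion of callbacks in tf.keras, so the `callback=callback` keyword above will not register the checkpoint; callbacks belong in the `callbacks` argument of `fit`/`fit_generator`. A hedged sketch of that wiring, keeping the same names and hyperparameters as train.py:

```python
import tensorflow as tf
from fcn8s import FCN8s
from utils import DataGenerator

TrainSet = DataGenerator("./data/train_image.txt", "./data/train_labels", 2)
model = FCN8s(n_class=21)
callback = tf.keras.callbacks.ModelCheckpoint("FCN8s.h5", verbose=1, save_weights_only=True)
model.compile(optimizer=tf.keras.optimizers.Adam(lr=1e-4),
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])
# Checkpoints are written by handing the callback to fit_generator, not compile.
model.fit_generator(TrainSet, steps_per_epoch=6000, epochs=30, callbacks=[callback])
```

With `save_weights_only=True`, the resulting FCN8s.h5 is the file that test.py restores with `load_weights`.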

5-Image_Segmentation/FCN/utils.py

Lines changed: 114 additions & 0 deletions
@@ -0,0 +1,114 @@
+#! /usr/bin/env python
+# coding=utf-8
+#================================================================
+#   Copyright (C) 2019 * Ltd. All rights reserved.
+#
+#   Editor      : VIM
+#   File name   : utils.py
+#   Author      : YunYang1994
+#   Created date: 2019-10-12 17:47:24
+#   Description :
+#
+#================================================================
+
+import os
+import cv2
+import random
+import numpy as np
+
+from PIL import Image
+
+classes = ['background','aeroplane','bicycle','bird','boat',
+           'bottle','bus','car','cat','chair','cow','diningtable',
+           'dog','horse','motorbike','person','potted plant',
+           'sheep','sofa','train','tv/monitor']
+# RGB color for each class
+colormap = [[0,0,0],[128,0,0],[0,128,0], [128,128,0], [0,0,128],
+            [128,0,128],[0,128,128],[128,128,128],[64,0,0],[192,0,0],
+            [64,128,0],[192,128,0],[64,0,128],[192,0,128],
+            [64,128,128],[192,128,128],[0,64,0],[128,64,0],
+            [0,192,0],[128,192,0],[0,64,128]]
+
+rgb_mean = np.array([0.485, 0.456, 0.406])
+rgb_std = np.array([0.229, 0.224, 0.225])
+
+def visual_result(image, label, alpha=0.7):
+    """
+    image shape -> [H, W, C]
+    label shape -> [H, W]
+    """
+    image = (image * rgb_std + rgb_mean) * 255
+    image, label = image.astype(np.int), label.astype(np.int)
+    H, W, C = image.shape
+    masks_color = np.zeros(shape=[H, W, C])
+    inv_masks_color = np.zeros(shape=[H, W, C])
+    cls = []
+    for i in range(H):
+        for j in range(W):
+            cls_idx = label[i, j]
+            masks_color[i, j] = np.array(colormap[cls_idx])
+            cls.append(cls_idx)
+            if classes[cls_idx] == "background":
+                inv_masks_color[i, j] = alpha * image[i, j]
+
+    show_image = np.zeros(shape=[224, 672, 3])
+    cls = set(cls)
+    for x in cls:
+        print("=> ", classes[x])
+    show_image[:, :224, :] = image
+    show_image[:, 224:448, :] = masks_color
+    show_image[:, 448:, :] = (1-alpha)*image + alpha*masks_color + inv_masks_color
+    show_image = Image.fromarray(np.uint8(show_image))
+    return show_image
+
+def create_image_label_path_generator(images_filepath, labels_filepath):
+    image_paths = open(images_filepath).readlines()
+    all_label_txts = os.listdir(labels_filepath)
+    image_label_paths = []
+    for label_txt in all_label_txts:
+        label_name = label_txt[:-4]
+        label_path = labels_filepath + "/" + label_txt
+        for image_path in image_paths:
+            image_path = image_path.rstrip()
+            image_name = image_path.split("/")[-1][:-4]
+            if label_name == image_name:
+                image_label_paths.append((image_path, label_path))
+    while True:
+        random.shuffle(image_label_paths)
+        for i in range(len(image_label_paths)):
+            yield image_label_paths[i]
+
+def process_image_label(image_path, label_path):
+    # image = misc.imread(image_path)
+    image = cv2.imread(image_path)
+    image = cv2.resize(image, (224, 224), interpolation=cv2.INTER_NEAREST)
+    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    # data augmentation here
+    # pass
+    # image transformation here
+    image = (image / 255. - rgb_mean) / rgb_std
+
+    label = open(label_path).readlines()
+    label = [np.array(line.rstrip().split(" ")) for line in label]
+    label = np.array(label, dtype=np.int)
+    label = cv2.resize(label, (224, 224), interpolation=cv2.INTER_NEAREST)
+    label = label.astype(np.int)
+
+    return image, label
+
+
+def DataGenerator(train_image_txt, train_labels_dir, batch_size):
+    """
+    generate image and mask at the same time
+    """
+    image_label_path_generator = create_image_label_path_generator(
+        train_image_txt, train_labels_dir
+    )
+    while True:
+        images = np.zeros(shape=[batch_size, 224, 224, 3])
+        labels = np.zeros(shape=[batch_size, 224, 224], dtype=np.float)
+        for i in range(batch_size):
+            image_path, label_path = next(image_label_path_generator)
+            image, label = process_image_label(image_path, label_path)
+            images[i], labels[i] = image, label
+        yield images, labels
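`visual_result` colors the mask with a per-pixel Python loop, which is easy to read but slow for 224x224 labels. A vectorized sketch of the same colormap lookup, not part of the commit and reusing the `classes` and `colormap` constants defined above, does it with one fancy-indexing step:

```python
import numpy as np
from utils import classes, colormap  # constants defined in the file above

def label_to_color(label):
    """Map an [H, W] array of class indices to an [H, W, 3] RGB mask."""
    palette = np.array(colormap, dtype=np.uint8)  # shape [21, 3]
    return palette[label]                         # fancy indexing replaces the nested loops

# Example: background everywhere except a square of class "person".
label = np.zeros((224, 224), dtype=np.int64)
label[80:160, 80:160] = classes.index("person")
mask = label_to_color(label)                      # shape (224, 224, 3)
```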
