신아형

add code

1 +{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"name":"augmentation.ipynb","provenance":[],"collapsed_sections":[],"authorship_tag":"ABX9TyM0lQ+UqU7Sa/uXs3VwvxDl"},"kernelspec":{"name":"python3","display_name":"Python 3"}},"cells":[{"cell_type":"code","metadata":{"id":"wYGqloqDkEoU","colab_type":"code","outputId":"0d22028c-119d-4823-df3f-35d439ca019f","executionInfo":{"status":"ok","timestamp":1591716524562,"user_tz":-540,"elapsed":32835,"user":{"displayName":"‍신아형[학생](소프트웨어융합대학 컴퓨터공학과)","photoUrl":"","userId":"02057930622140727302"}},"colab":{"base_uri":"https://localhost:8080/","height":127}},"source":["from google.colab import drive\n","drive.mount('/content/gdrive')"],"execution_count":0,"outputs":[{"output_type":"stream","text":["Go to this URL in a browser: https://accounts.google.com/o/oauth2/auth?client_id=947318989803-6bn6qk8qdgf4n4g3pfee6491hc0brc4i.apps.googleusercontent.com&redirect_uri=urn%3aietf%3awg%3aoauth%3a2.0%3aoob&response_type=code&scope=email%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdocs.test%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdrive%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdrive.photos.readonly%20https%3a%2f%2fwww.googleapis.com%2fauth%2fpeopleapi.readonly\n","\n","Enter your authorization code:\n","··········\n","Mounted at /content/gdrive\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"cPpLXwOPGYkB","colab_type":"code","colab":{}},"source":["import imgaug; print(imgaug.__file__)\n","!cd /content/../usr/local/lib/python3.6/dist-packages/\n","!pip uninstall imgaug\n","!pip install git+https://github.com/aleju/imgaug.git\n","!pip3 install pascal_voc_writer"],"execution_count":0,"outputs":[]},{"cell_type":"code","metadata":{"id":"3WumbxkdSAYo","colab_type":"code","colab":{}},"source":["# xml파일 파싱해서 filename, bounding-box 정보 반환\n","\n","import xml.etree.ElementTree as ET\n","\n","def read_anntation(xml_file: str):\n"," tree = ET.parse(xml_file)\n"," root = tree.getroot()\n","\n"," bounding_box_list = []\n","\n"," file_name = root.find('filename').text\n"," for obj in root.iter('object'):\n","\n"," object_label = obj.find(\"name\").text\n"," for box in obj.findall(\"bndbox\"):\n"," x_min = int(box.find(\"xmin\").text)\n"," y_min = int(box.find(\"ymin\").text)\n"," x_max = int(box.find(\"xmax\").text)\n"," y_max = int(box.find(\"ymax\").text)\n","\n"," bounding_box = [object_label, x_min, y_min, x_max, y_max]\n"," bounding_box_list.append(bounding_box)\n","\n"," return bounding_box_list, file_name"],"execution_count":0,"outputs":[]},{"cell_type":"code","metadata":{"id":"A-982sMgSOCV","colab_type":"code","colab":{}},"source":["# 4차원 nparray로 변환된 이미지, [bounding-box 리스트, xml 파일명, 이미지 파일명] 리스트 반환\n","\n","from os import listdir\n","import cv2\n","import numpy as np\n","\n","def read_train_dataset(dir):\n"," images = []\n"," annotations = []\n","\n"," for file in listdir(dir):\n"," if 'jpg' in file.lower() or 'png' in file.lower():\n"," images.append(cv2.imread(dir + file, 1))\n"," annotation_file = file.replace(file.split('.')[-1], 'xml')\n"," bounding_box_list, file_name = read_anntation(dir + annotation_file)\n"," annotations.append((bounding_box_list, annotation_file, file_name))\n","\n"," images = np.array(images)\n","\n"," return images, annotations"],"execution_count":0,"outputs":[]},{"cell_type":"code","metadata":{"id":"5Kz66PqlST6Q","colab_type":"code","colab":{}},"source":["import imgaug as ia\n","from imgaug import augmenters as iaa\n","from pascal_voc_writer import Writer\n","\n","ia.seed(1)\n","\n","\n","dir = 
'/content/gdrive/My Drive/capstone/data/' # input 이미지 디렉토리\n","output_dir='/content/gdrive/My Drive/capstone/data/' # output 이미지 디렉토리\n","\n","images, annotations = read_train_dataset(dir)\n","\n","for idx in range(len(images)):\n"," image = images[idx]\n"," boxes = annotations[idx][0]\n","\n"," ia_bounding_boxes = []\n"," for box in boxes:\n"," ia_bounding_boxes.append(ia.BoundingBox(x1=box[1], y1=box[2], x2=box[3], y2=box[4]))\n"," bbs = ia.BoundingBoxesOnImage(ia_bounding_boxes, shape=image.shape)\n","\n"," ######어둡게\n"," seq = iaa.MultiplyAndAddToBrightness(mul=(0.5, 0.5), add=(-10, 10))\n","\n"," ######밝게\n"," #seq = iaa.MultiplyAndAddToBrightness(mul= (1, 2.5), add=(-15, 15))\n","\n"," seq_det = seq.to_deterministic()\n","\n"," image_aug = seq_det.augment_images([image])[0]\n"," bbs_aug = seq_det.augment_bounding_boxes([bbs])[0]\n","\n"," new_image_file = output_dir + 'dark_' + annotations[idx][2]\n"," cv2.imwrite(new_image_file, image_aug)\n","\n"," h, w = np.shape(image_aug)[0:2]\n"," voc_writer = Writer(new_image_file, w, h)\n","\n"," for i in range(len(bbs_aug.bounding_boxes)):\n"," bb_box = bbs_aug.bounding_boxes[i]\n"," voc_writer.addObject(boxes[i][0], int(bb_box.x1), int(bb_box.y1), int(bb_box.x2), int(bb_box.y2))\n","\n"," voc_writer.save(output_dir + 'dark_' + annotations[idx][1])\n"," print(output_dir + 'dark_' + annotations[idx][1])"],"execution_count":0,"outputs":[]}]}
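The notebook keeps the brighten augmenter commented out and hard-codes the 'dark_' output prefix, so producing both variants means editing the cell twice. Below is a minimal sketch of how the same loop could be parameterized to run both brightness settings in one pass; it reuses the imgaug and pascal_voc_writer calls from the notebook, and the helper name and prefix strings are only illustrative.

# Sketch: run both brightness variants over the dataset produced by
# read_train_dataset() above, without hand-editing the augmenter or prefix.
import cv2
import numpy as np
import imgaug as ia
from imgaug import augmenters as iaa
from pascal_voc_writer import Writer

variants = {
    'dark_':   iaa.MultiplyAndAddToBrightness(mul=(0.5, 0.5), add=(-10, 10)),
    'bright_': iaa.MultiplyAndAddToBrightness(mul=(1, 2.5), add=(-15, 15)),
}

def augment_and_save(images, annotations, output_dir):
    for prefix, seq in variants.items():
        for idx in range(len(images)):
            image = images[idx]
            boxes = annotations[idx][0]
            bbs = ia.BoundingBoxesOnImage(
                [ia.BoundingBox(x1=b[1], y1=b[2], x2=b[3], y2=b[4]) for b in boxes],
                shape=image.shape)

            seq_det = seq.to_deterministic()
            image_aug = seq_det.augment_images([image])[0]
            bbs_aug = seq_det.augment_bounding_boxes([bbs])[0]

            # Write the augmented image and a matching Pascal VOC annotation.
            new_image_file = output_dir + prefix + annotations[idx][2]
            cv2.imwrite(new_image_file, image_aug)

            h, w = np.shape(image_aug)[0:2]
            voc_writer = Writer(new_image_file, w, h)
            for box, bb in zip(boxes, bbs_aug.bounding_boxes):
                voc_writer.addObject(box[0], int(bb.x1), int(bb.y1), int(bb.x2), int(bb.y2))
            voc_writer.save(output_dir + prefix + annotations[idx][1])

# Example usage (same directory layout as the notebook):
# images, annotations = read_train_dataset('/content/gdrive/My Drive/capstone/data/')
# augment_and_save(images, annotations, '/content/gdrive/My Drive/capstone/data/')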
1 +"""
2 +Usage:
3 +
4 +# Create train data:
5 +python generate_tfrecord.py --label=<LABEL> --csv_input=<PATH_TO_ANNOTATIONS_FOLDER>/train_labels.csv --output_path=<PATH_TO_ANNOTATIONS_FOLDER>/train.record <PATH_TO_ANNOTATIONS_FOLDER>/label_map.pbtxt
6 +
7 +# Create test data:
8 +python generate_tfrecord.py --label=<LABEL> --csv_input=<PATH_TO_ANNOTATIONS_FOLDER>/test_labels.csv --output_path=<PATH_TO_ANNOTATIONS_FOLDER>/test.record --label_map <PATH_TO_ANNOTATIONS_FOLDER>/label_map.pbtxt
9 +"""
10 +
11 +from __future__ import division
12 +from __future__ import print_function
13 +from __future__ import absolute_import
14 +
15 +import os
16 +import io
17 +import pandas as pd
18 +import tensorflow as tf
19 +import sys
20 +
21 +sys.path.append("../../models/research")
22 +
23 +from PIL import Image
24 +from object_detection.utils import dataset_util
25 +from collections import namedtuple, OrderedDict
26 +
27 +flags = tf.app.flags
28 +flags.DEFINE_string("csv_input", "", "Path to the CSV input")
29 +flags.DEFINE_string("output_path", "", "Path to output TFRecord")
30 +flags.DEFINE_string(
31 + "label_map",
32 + "",
33 + "Path to the `label_map.pbtxt` contains the <class_name>:<class_index> pairs generated by `xml_to_csv.py` or manually.",
34 +)
35 +# if your image has more labels input them as
36 +# flags.DEFINE_string('label0', '', 'Name of class[0] label')
37 +# flags.DEFINE_string('label1', '', 'Name of class[1] label')
38 +# and so on.
39 +flags.DEFINE_string("img_path", "", "Path to images")
40 +FLAGS = flags.FLAGS
41 +
42 +
43 +def split(df, group):
44 + data = namedtuple("data", ["filename", "object"])
45 + gb = df.groupby(group)
46 + return [
47 + data(filename, gb.get_group(x))
48 + for filename, x in zip(gb.groups.keys(), gb.groups)
49 + ]
50 +
51 +
52 +def create_tf_example(group, path, label_map):
53 + with tf.gfile.GFile(os.path.join(path, "{}".format(group.filename)), "rb") as fid:
54 + encoded_jpg = fid.read()
55 + encoded_jpg_io = io.BytesIO(encoded_jpg)
56 + image = Image.open(encoded_jpg_io)
57 + width, height = image.size
58 +
59 + filename = group.filename.encode("utf8")
60 + image_format = b"jpg"
61 + # check if the image format is matching with your images.
62 + xmins = []
63 + xmaxs = []
64 + ymins = []
65 + ymaxs = []
66 + classes_text = []
67 + classes = []
68 +
69 + for index, row in group.object.iterrows():
70 + xmins.append(row["xmin"] / width)
71 + xmaxs.append(row["xmax"] / width)
72 + ymins.append(row["ymin"] / height)
73 + ymaxs.append(row["ymax"] / height)
74 + classes_text.append(row["class"].encode("utf8"))
75 + class_index = label_map.get(row["class"])
76 + assert (
77 + class_index is not None
78 + ), "class label: `{}` not found in label_map: {}".format(
79 + row["class"], label_map
80 + )
81 + classes.append(class_index)
82 +
83 + tf_example = tf.train.Example(
84 + features=tf.train.Features(
85 + feature={
86 + "image/height": dataset_util.int64_feature(height),
87 + "image/width": dataset_util.int64_feature(width),
88 + "image/filename": dataset_util.bytes_feature(filename),
89 + "image/source_id": dataset_util.bytes_feature(filename),
90 + "image/encoded": dataset_util.bytes_feature(encoded_jpg),
91 + "image/format": dataset_util.bytes_feature(image_format),
92 + "image/object/bbox/xmin": dataset_util.float_list_feature(xmins),
93 + "image/object/bbox/xmax": dataset_util.float_list_feature(xmaxs),
94 + "image/object/bbox/ymin": dataset_util.float_list_feature(ymins),
95 + "image/object/bbox/ymax": dataset_util.float_list_feature(ymaxs),
96 + "image/object/class/text": dataset_util.bytes_list_feature(
97 + classes_text
98 + ),
99 + "image/object/class/label": dataset_util.int64_list_feature(classes),
100 + }
101 + )
102 + )
103 + return tf_example
104 +
105 +
106 +def main(_):
107 + writer = tf.python_io.TFRecordWriter(FLAGS.output_path)
108 + path = os.path.join(os.getcwd(), FLAGS.img_path)
109 + examples = pd.read_csv(FLAGS.csv_input)
110 +
111 + # Load the `label_map` from pbtxt file.
112 + from object_detection.utils import label_map_util
113 +
114 + label_map = label_map_util.load_labelmap(FLAGS.label_map)
115 + categories = label_map_util.convert_label_map_to_categories(
116 + label_map, max_num_classes=90, use_display_name=True
117 + )
118 + category_index = label_map_util.create_category_index(categories)
119 + label_map = {}
120 + for k, v in category_index.items():
121 + label_map[v.get("name")] = v.get("id")
122 + grouped = split(examples, "filename")
123 + for group in grouped:
124 + tf_example = create_tf_example(group, path, label_map)
125 + writer.write(tf_example.SerializeToString())
126 +
127 + writer.close()
128 + output_path = os.path.join(os.getcwd(), FLAGS.output_path)
129 + print("Successfully created the TFRecords: {}".format(output_path))
130 +
131 +
132 +if __name__ == "__main__":
133 + tf.app.run()
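The script only prints the output path on success. A quick sanity check is to count the serialized examples and compare them against the number of unique filenames in the source CSV, since one tf.train.Example is written per image. A minimal sketch, using the same TF 1.x API family as the script above; the paths are placeholders.

# Sketch: verify a generated TFRecord against its source CSV.
import pandas as pd
import tensorflow as tf

csv_path = "annotations/train_labels.csv"   # hypothetical path
record_path = "annotations/train.record"    # hypothetical path

num_images = pd.read_csv(csv_path)["filename"].nunique()
num_records = sum(1 for _ in tf.python_io.tf_record_iterator(record_path))

# Expect one serialized tf.train.Example per image (per CSV filename group).
print("images in csv: {}, examples in record: {}".format(num_images, num_records))
assert num_images == num_records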
[additional diff not shown: too large to display]
1 +"""
2 +Usage:
3 +# Create train data:
4 +python xml_to_csv.py -i [PATH_TO_IMAGES_FOLDER]/train -o [PATH_TO_ANNOTATIONS_FOLDER]/train_labels.csv
5 +
6 +# Create test data:
7 +python xml_to_csv.py -i [PATH_TO_IMAGES_FOLDER]/test -o [PATH_TO_ANNOTATIONS_FOLDER]/test_labels.csv
8 +"""
9 +
10 +import os
11 +import glob
12 +import pandas as pd
13 +import argparse
14 +import xml.etree.ElementTree as ET
15 +
16 +
17 +def xml_to_csv(path):
18 + """Iterates through all .xml files (generated by labelImg) in a given directory and combines them in a single Pandas datagrame.
19 +
20 + Parameters:
21 + ----------
22 + path : {str}
23 + The path containing the .xml files
24 + Returns
25 + -------
26 + Pandas DataFrame
27 + The produced dataframe
28 + """
29 + classes_names = []
30 + xml_list = []
31 + for xml_file in glob.glob(path + "/*.xml"):
32 + tree = ET.parse(xml_file)
33 + root = tree.getroot()
34 + for member in root.findall("object"):
35 + classes_names.append(member[0].text)
36 + value = (
37 + root.find("filename").text,
38 + int(root.find("size")[0].text),
39 + int(root.find("size")[1].text),
40 + member[0].text,
41 + int(member[4][0].text),
42 + int(member[4][1].text),
43 + int(member[4][2].text),
44 + int(member[4][3].text),
45 + )
46 + xml_list.append(value)
47 + column_name = [
48 + "filename",
49 + "width",
50 + "height",
51 + "class",
52 + "xmin",
53 + "ymin",
54 + "xmax",
55 + "ymax",
56 + ]
57 + xml_df = pd.DataFrame(xml_list, columns=column_name)
58 + classes_names = list(set(classes_names))
59 + classes_names.sort()
60 + return xml_df, classes_names
61 +
62 +
63 +def main():
64 + # Initiate argument parser
65 + parser = argparse.ArgumentParser(
66 + description="Sample TensorFlow XML-to-CSV converter"
67 + )
68 + parser.add_argument(
69 + "-i",
70 + "--inputDir",
71 + help="Path to the folder where the input .xml files are stored",
72 + type=str,
73 + )
74 + parser.add_argument(
75 + "-o", "--outputFile", help="Name of output .csv file (including path)", type=str
76 + )
77 +
78 + parser.add_argument(
79 + "-l",
80 + "--labelMapDir",
81 + help="Directory path to save label_map.pbtxt file is specified.",
82 + type=str,
83 + default="",
84 + )
85 +
86 + args = parser.parse_args()
87 +
88 + if args.inputDir is None:
89 + args.inputDir = os.getcwd()
90 + if args.outputFile is None:
91 + args.outputFile = args.inputDir + "/labels.csv"
92 +
93 + assert os.path.isdir(args.inputDir)
94 + os.makedirs(os.path.dirname(args.outputFile), exist_ok=True)
95 + xml_df, classes_names = xml_to_csv(args.inputDir)
96 + xml_df.to_csv(args.outputFile, index=None)
97 + print("Successfully converted xml to csv.")
98 + if args.labelMapDir:
99 + os.makedirs(args.labelMapDir, exist_ok=True)
100 + label_map_path = os.path.join(args.labelMapDir, "label_map.pbtxt")
101 + print("Generate `{}`".format(label_map_path))
102 +
103 + # Create the `label_map.pbtxt` file
104 + pbtxt_content = ""
105 + for i, class_name in enumerate(classes_names):
106 + pbtxt_content = (
107 + pbtxt_content
108 + + "item {{\n id: {0}\n name: '{1}'\n}}\n\n".format(
109 + i + 1, class_name
110 + )
111 + )
112 + pbtxt_content = pbtxt_content.strip()
113 + with open(label_map_path, "w") as f:
114 + f.write(pbtxt_content)
115 +
116 +
117 +if __name__ == "__main__":
118 + main()
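For a quick check without the CLI, the converter can also be driven from a Python session. A minimal sketch, assuming a hypothetical annotations/train folder of labelImg XML files; xml_to_csv() is the function defined above.

# Sketch: call the converter directly and inspect the result.
from xml_to_csv import xml_to_csv

xml_df, classes_names = xml_to_csv("annotations/train")  # hypothetical path

print(xml_df.columns.tolist())  # ['filename', 'width', 'height', 'class', 'xmin', 'ymin', 'xmax', 'ymax']
print(classes_names)            # sorted list of unique class names found in the XML files
xml_df.to_csv("annotations/train_labels.csv", index=None)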