최지우

Add code

import cv2
import numpy as np
import serial

# Receive the webcam signal
VideoSignal = cv2.VideoCapture(0)
# Load the YOLO weights and cfg files
YOLO_net = cv2.dnn.readNet('yolov3-tiny_last.weights', 'yolov3-tiny.cfg')

# Rebuild the YOLO network: class names and output layers
classes = []
with open("obj.names", "r") as f:
    classes = [line.strip() for line in f.readlines()]
layer_names = YOLO_net.getLayerNames()
output_layers = [layer_names[i[0] - 1] for i in YOLO_net.getUnconnectedOutLayers()]

while True:
    # Read a webcam frame
    ret, frame = VideoSignal.read()
    h, w, c = frame.shape

    # YOLO input
    blob = cv2.dnn.blobFromImage(frame, 0.00392, (416, 416), (0, 0, 0),
                                 True, crop=False)
    YOLO_net.setInput(blob)
    outs = YOLO_net.forward(output_layers)

    class_ids = []
    confidences = []
    boxes = []

    for out in outs:
        for detection in out:
            scores = detection[5:]
            class_id = np.argmax(scores)
            confidence = scores[class_id]
            if confidence > 0.3:
                # Object detected
                center_x = int(detection[0] * w)
                center_y = int(detection[1] * h)
                dw = int(detection[2] * w)
                dh = int(detection[3] * h)
                # Rectangle coordinates
                x = int(center_x - dw / 2)
                y = int(center_y - dh / 2)
                boxes.append([x, y, dw, dh])
                confidences.append(float(confidence))
                class_ids.append(class_id)

    indexes = cv2.dnn.NMSBoxes(boxes, confidences, 0.45, 0.4)

    for i in range(len(boxes)):
        if i in indexes:
            x, y, w, h = boxes[i]
            label = 'box'
            score = confidences[i]
            # Draw the bounding box and class label on the frame
            cv2.rectangle(frame, (x, y), (x + w, y + h), (0, 0, 255), 5)
            cv2.putText(frame, label, (x, y - 20), cv2.FONT_ITALIC, 0.5,
                        (255, 255, 255), 1)

    cv2.imshow("YOLOv3", frame)
    if cv2.waitKey(100) > 0:
        break

VideoSignal.release()
cv2.destroyAllWindows()
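A portability note on the script above (general OpenCV behavior, not something specific to this repo): layer_names[i[0] - 1] assumes getUnconnectedOutLayers() returns nested single-element arrays, as it did before OpenCV 4.5.4; newer versions return a flat array, so i[0] raises an IndexError on a scalar. A version-agnostic sketch:

def get_output_layers(net):
    layer_names = net.getLayerNames()
    # flatten() tolerates both the old nested ([[200], [227]]) and the
    # new flat ([200, 227]) return shapes of getUnconnectedOutLayers().
    ids = np.array(net.getUnconnectedOutLayers()).flatten()
    return [layer_names[i - 1] for i in ids]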
from IPython.display import display
from PIL import Image
from yolo import YOLO
import cvlib as cv
from cvlib.object_detection import draw_bbox
import cv2
import tensorflow.compat.v1.keras.backend as K
import tensorflow as tf

tf.compat.v1.disable_eager_execution()


def objectDetection(file, model_path, class_path):
    yolo = YOLO(model_path=model_path, classes_path=class_path,
                anchors_path='model_data/tiny_yolo_anchors.txt')
    image = Image.open(file)
    result_image = yolo.detect_image(image)
    result_image.save('test.jpg', 'JPEG')


webcam = cv2.VideoCapture(0)
if not webcam.isOpened():
    print("Could not open webcam")
    exit()

yolo = YOLO(model_path='model_data/yolo_tiny_best.h5',
            classes_path='data/box/classes.txt',
            anchors_path='model_data/tiny_yolo_anchors.txt')

# loop through frames
while webcam.isOpened():
    status, frame = webcam.read()
    if not status:
        break
    '''
    cv2.imwrite('frame.jpg', frame)
    objectDetection('frame.jpg', 'model_data/yolo_tiny_best.h5', 'data/box/classes.txt')
    out = cv2.imread('test.jpg')
    '''
    cv2.imwrite('frame.jpg', frame)
    tst = Image.open('frame.jpg')
    out = yolo.detect_image(tst)
    out.save('test.jpg', 'JPEG')
    out = cv2.imread('test.jpg')
    cv2.imshow("Real-time object detection", out)
    if cv2.waitKey(1) & 0xFF == ord('q'):
        break

webcam.release()
cv2.destroyAllWindows()
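Round-tripping every frame through frame.jpg and test.jpg on disk is slow. A sketch of the same loop body converting between OpenCV and PIL in memory instead (this assumes yolo.detect_image returns a PIL image, as it does in yolo.py below):

import numpy as np
# Convert the BGR OpenCV frame to a PIL RGB image, detect, convert back.
pil_in = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
pil_out = yolo.detect_image(pil_in)
out = cv2.cvtColor(np.asarray(pil_out), cv2.COLOR_RGB2BGR)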
import serial
import cv2
import numpy as np
import ocr_form

ser = serial.Serial('/dev/ttyAMA0', 115200)
if ser.isOpen():
    print("Serial Communication in operation")

LiveCam = cv2.VideoCapture(0)
YOLO_net = cv2.dnn.readNet('yolov3-tiny_best.weights', 'yolov3-tiny.cfg')
classes = ['box']
layer_names = YOLO_net.getLayerNames()
output_layers = [layer_names[i[0] - 1] for i in YOLO_net.getUnconnectedOutLayers()]

frame_num = 0
while LiveCam.isOpened():
    ret, frame = LiveCam.read()
    if ret is False:
        print("No Video Input")
        break
    if frame_num != 20:
        frame_num += 1
    elif frame_num == 20:
        # Run detection on every 20th frame only
        frame_num = 0
        h, w, c = frame.shape
        blob = cv2.dnn.blobFromImage(frame, 0.00392, (416, 416), (0, 0, 0), True, crop=False)
        YOLO_net.setInput(blob)
        outs = YOLO_net.forward(output_layers)

        class_ids = []
        confidences = []
        boxes = []
        for out in outs:
            for detection in out:
                scores = detection[5:]
                class_id = np.argmax(scores)
                confidence = scores[class_id]
                if confidence > 0.4:
                    center_x = int(detection[0] * w)
                    center_y = int(detection[1] * h)
                    dw = int(detection[2] * w)
                    dh = int(detection[3] * h)
                    x = int(center_x - dw / 2)
                    y = int(center_y - dh / 2)
                    boxes.append([x, y, dw, dh])
                    confidences.append(float(confidence))
                    class_ids.append(class_id)

        indexes = cv2.dnn.NMSBoxes(boxes, confidences, 0.45, 0.4)

        if confidences:
            # Steer toward the highest-confidence box; x = 320 is the
            # center line, assuming a 640-px-wide capture.
            bestscore = confidences.index(max(confidences))
            best_x, best_y, best_w, best_h = boxes[bestscore]
            if best_x > 320:
                print("Move right")
                ser.write(serial.to_bytes([int('1', 16)]))
            elif best_x + best_w < 320:
                print("Move left")
                ser.write(serial.to_bytes([int('2', 16)]))
            else:
                print("Go straight")
                cv2.imwrite('cap_img.jpg', frame)
                ser.write(serial.to_bytes([int('3', 16)]))
                break
            cv2.rectangle(frame, (best_x, best_y), (best_x + best_w, best_y + best_h), (0, 0, 255), 5)
            cv2.putText(frame, 'box', (best_x, best_y - 20), cv2.FONT_ITALIC, 0.5, (255, 255, 255), 1)

    cv2.imshow("YOLOv3", frame)
    if cv2.waitKey(100) > 0:
        break

LiveCam.release()
cv2.destroyAllWindows()

'''
image = cv2.imread("cap_img.jpg")
template = cv2.imread("myform.jpg")
ocr_result = ocr_form.ocr(image, template)
(name, result) = ocr_result["name"]
(address, result) = ocr_result["address"]
(detail_address, result) = ocr_result["detail_address"]
name = name.replace(" ", "")
address = address.replace(" ", "")
detail_address = detail_address.replace(" ", "")
print(name)
print(address)
print(detail_address)
'''
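A side note on the serial commands above: the 0x1/0x2/0x3 codes come straight from the script, and pyserial's write() accepts plain bytes literals, so the serial.to_bytes calls can be written more directly. A minimal sketch:

# Command bytes used by the script above (meanings from its print statements).
CMD_RIGHT = b'\x01'    # steer right
CMD_LEFT = b'\x02'     # steer left
CMD_FORWARD = b'\x03'  # target centered: capture a frame, drive forward, stop the loop

ser.write(CMD_RIGHT)   # equivalent to ser.write(serial.to_bytes([int('1', 16)]))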
person
bicycle
car
motorbike
aeroplane
bus
train
truck
boat
traffic light
fire hydrant
stop sign
parking meter
bench
bird
cat
dog
horse
sheep
cow
elephant
bear
zebra
giraffe
backpack
umbrella
handbag
tie
suitcase
frisbee
skis
snowboard
sports ball
kite
baseball bat
baseball glove
skateboard
surfboard
tennis racket
bottle
wine glass
cup
fork
knife
spoon
bowl
banana
apple
sandwich
orange
broccoli
carrot
hot dog
pizza
donut
cake
chair
sofa
pottedplant
bed
diningtable
toilet
tvmonitor
laptop
mouse
remote
keyboard
cell phone
microwave
oven
toaster
sink
refrigerator
book
clock
vase
scissors
teddy bear
hair drier
toothbrush
10,14, 23,27, 37,58, 81,82, 135,169, 344,319
aeroplane
bicycle
bird
boat
bottle
bus
car
cat
chair
cow
diningtable
dog
horse
motorbike
person
pottedplant
sheep
sofa
train
tvmonitor
10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
classes = 1
train = data/train.txt
valid = data/train.txt
names = data/obj.names
backup = backup/
box
import rotate_image
from collections import namedtuple
import pytesseract
import argparse
import imutils
import cv2


def ocr(image, template):
    print("[Loading...] OCR Location Setting")
    OCRLocation = namedtuple("OCRLocation", ["id", "bbox", "filter_keywords"])
    OCR_Locations = [
        OCRLocation("name", (27, 96, 60, 20), []),
        OCRLocation("address", (27, 115, 276, 21), []),
        OCRLocation("detail_address", (28, 134, 409, 36), []),
    ]

    print("[Loading...] aligning images")
    aligned = rotate_image.rotate_image(image, template)

    print("[Loading...] Proceeding OCR")
    parsingResults = []
    for loc in OCR_Locations:
        (x, y, w, h) = loc.bbox
        roi = aligned[y:y+h, x:x+w]
        cv2.imshow(loc.id, roi)
        cv2.waitKey(0)
        rgb = cv2.cvtColor(roi, cv2.COLOR_BGR2RGB)
        text = pytesseract.image_to_string(rgb, lang='Hangul')
        for line in text.split("\n"):
            if len(line) == 0:
                continue
            lower = line.lower()
            count = sum([lower.count(x) for x in loc.filter_keywords])
            if count == 0:
                parsingResults.append((loc, line))

    results = {}
    for (loc, line) in parsingResults:
        r = results.get(loc.id, None)
        if r is None:
            results[loc.id] = (line, loc._asdict())
        else:
            (existingText, loc) = r
            text = "{}\n{}".format(existingText, line)
            results[loc["id"]] = (text, loc)

    for (locID, result) in results.items():
        (text, loc) = result
        print(loc["id"])
        print("=" * len(loc["id"]))
        print("{}\n".format(text))

    cv2.imshow("Input", imutils.resize(image))
    cv2.imshow("Output", imutils.resize(aligned))
    cv2.waitKey(0)
    return results
import cv2
import numpy as np
import ocr_form
image = cv2.imread("myimg1.png")
template = cv2.imread("myform.jpg")
ocr_result = ocr_form.ocr(image, template)
(name, result) = ocr_result["name"]
(address, result) = ocr_result["address"]
(detail_address, result) = ocr_result["detail_address"]
name = name.replace(" ","")
address = address.replace(" ","")
detail_address = detail_address.replace(" ","")
print(name)
print(address)
print(detail_address)
# import necessary packages
import cvlib as cv
from cvlib.object_detection import draw_bbox
import cv2

# open webcam
webcam = cv2.VideoCapture(0)
if not webcam.isOpened():
    print("Could not open webcam")
    exit()

# loop through frames
while webcam.isOpened():
    # read frame from webcam
    status, frame = webcam.read()
    if not status:
        break
    # apply object detection
    bbox, label, conf = cv.detect_common_objects(frame)
    # draw bounding box over detected objects
    out = draw_bbox(frame, bbox, label, conf, write_conf=True)
    # display output
    cv2.imshow("Real-time object detection", out)
    # press "Q" to stop
    if cv2.waitKey(1) & 0xFF == ord('q'):
        break

# release resources
webcam.release()
cv2.destroyAllWindows()
import numpy as np
import imutils
import cv2


def rotate_image(image, template, maxFeatures=500, keepPercent=0.2, debug=False):
    gray_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    gray_template = cv2.cvtColor(template, cv2.COLOR_BGR2GRAY)

    # Detect ORB keypoints and compute descriptors on both images
    orb = cv2.ORB_create(maxFeatures)
    (kpsA, descsA) = orb.detectAndCompute(gray_image, None)
    (kpsB, descsB) = orb.detectAndCompute(gray_template, None)

    # Brute-force Hamming matching, keeping only the best keepPercent matches
    method = cv2.DESCRIPTOR_MATCHER_BRUTEFORCE_HAMMING
    matcher = cv2.DescriptorMatcher_create(method)
    matches = matcher.match(descsA, descsB, None)
    matches = sorted(matches, key=lambda x: x.distance)
    keep = int(len(matches) * keepPercent)
    matches = matches[:keep]

    if debug:
        matchedVis = cv2.drawMatches(image, kpsA, template, kpsB, matches, None)
        matchedVis = imutils.resize(matchedVis, width=1000)
        cv2.imshow("Matched Keypoints", matchedVis)
        cv2.waitKey(0)

    ptsA = np.zeros((len(matches), 2), dtype=float)
    ptsB = np.zeros((len(matches), 2), dtype=float)
    for (i, m) in enumerate(matches):
        ptsA[i] = kpsA[m.queryIdx].pt
        ptsB[i] = kpsB[m.trainIdx].pt

    # Estimate the homography mapping the input onto the template, then warp
    (H, mask) = cv2.findHomography(ptsA, ptsB, method=cv2.RANSAC)
    (h, w) = template.shape[:2]
    aligned = cv2.warpPerspective(image, H, (w, h))
    return aligned
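One fragility worth noting in rotate_image(): cv2.findHomography needs at least four point correspondences, so on a frame where ORB finds too few matches the call fails (or H comes back None) and warpPerspective cannot run. A small guard that could be added right after the match list is trimmed, shown as a sketch rather than as part of the original file:

if len(matches) < 4:
    # Too few correspondences to estimate a homography; let the caller decide.
    raise ValueError("not enough ORB matches to align image to template")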
# -*- coding: utf-8 -*-
"""
Class definition of YOLO_v3 style detection model on image and video
"""

import colorsys
import os
from timeit import default_timer as timer

import numpy as np
from keras.models import load_model
from keras.layers import Input
from keras.utils import multi_gpu_model
from PIL import Image, ImageFont, ImageDraw
from tensorflow.compat.v1.keras import backend as K

from yolo3.model import yolo_eval, yolo_body, tiny_yolo_body
from yolo3.utils import letterbox_image


class YOLO(object):
    _defaults = {
        "model_path": 'model_data/yolo.h5',
        "anchors_path": 'model_data/yolo_anchors.txt',
        "classes_path": 'model_data/coco_classes.txt',
        "score": 0.3,
        "iou": 0.45,
        "model_image_size": (416, 416),
        "gpu_num": 1,
    }

    @classmethod
    def get_defaults(cls, n):
        if n in cls._defaults:
            return cls._defaults[n]
        else:
            return "Unrecognized attribute name '" + n + "'"

    def __init__(self, **kwargs):
        self.__dict__.update(self._defaults)  # set up default values
        self.__dict__.update(kwargs)  # and update with user overrides
        self.class_names = self._get_class()
        self.anchors = self._get_anchors()
        self.sess = K.get_session()
        self.boxes, self.scores, self.classes = self.generate()

    def _get_class(self):
        classes_path = os.path.expanduser(self.classes_path)
        with open(classes_path) as f:
            class_names = f.readlines()
        class_names = [c.strip() for c in class_names]
        return class_names

    def _get_anchors(self):
        anchors_path = os.path.expanduser(self.anchors_path)
        with open(anchors_path) as f:
            anchors = f.readline()
        anchors = [float(x) for x in anchors.split(',')]
        return np.array(anchors).reshape(-1, 2)

    def generate(self):
        model_path = os.path.expanduser(self.model_path)
        assert model_path.endswith('.h5'), 'Keras model or weights must be a .h5 file.'

        # Load model, or construct model and load weights.
        num_anchors = len(self.anchors)
        num_classes = len(self.class_names)
        is_tiny_version = num_anchors == 6  # default setting
        try:
            self.yolo_model = load_model(model_path, compile=False)
        except:
            self.yolo_model = tiny_yolo_body(Input(shape=(None, None, 3)), num_anchors//2, num_classes) \
                if is_tiny_version else yolo_body(Input(shape=(None, None, 3)), num_anchors//3, num_classes)
            self.yolo_model.load_weights(self.model_path)  # make sure model, anchors and classes match
        else:
            assert self.yolo_model.layers[-1].output_shape[-1] == \
                num_anchors/len(self.yolo_model.output) * (num_classes + 5), \
                'Mismatch between model and given anchor and class sizes'

        print('{} model, anchors, and classes loaded.'.format(model_path))

        # Generate colors for drawing bounding boxes.
        hsv_tuples = [(x / len(self.class_names), 1., 1.)
                      for x in range(len(self.class_names))]
        self.colors = list(map(lambda x: colorsys.hsv_to_rgb(*x), hsv_tuples))
        self.colors = list(
            map(lambda x: (int(x[0] * 255), int(x[1] * 255), int(x[2] * 255)),
                self.colors))
        np.random.seed(10101)  # Fixed seed for consistent colors across runs.
        np.random.shuffle(self.colors)  # Shuffle colors to decorrelate adjacent classes.
        np.random.seed(None)  # Reset seed to default.

        # Generate output tensor targets for filtered bounding boxes.
        self.input_image_shape = K.placeholder(shape=(2, ))
        if self.gpu_num >= 2:
            self.yolo_model = multi_gpu_model(self.yolo_model, gpus=self.gpu_num)
        boxes, scores, classes = yolo_eval(self.yolo_model.output, self.anchors,
                                           len(self.class_names), self.input_image_shape,
                                           score_threshold=self.score, iou_threshold=self.iou)
        return boxes, scores, classes

    def detect_image(self, image):
        start = timer()

        if self.model_image_size != (None, None):
            assert self.model_image_size[0] % 32 == 0, 'Multiples of 32 required'
            assert self.model_image_size[1] % 32 == 0, 'Multiples of 32 required'
            boxed_image = letterbox_image(image, tuple(reversed(self.model_image_size)))
        else:
            new_image_size = (image.width - (image.width % 32),
                              image.height - (image.height % 32))
            boxed_image = letterbox_image(image, new_image_size)
        image_data = np.array(boxed_image, dtype='float32')

        print(image_data.shape)
        image_data /= 255.
        image_data = np.expand_dims(image_data, 0)  # Add batch dimension.

        out_boxes, out_scores, out_classes = self.sess.run(
            [self.boxes, self.scores, self.classes],
            feed_dict={
                self.yolo_model.input: image_data,
                self.input_image_shape: [image.size[1], image.size[0]],
                K.learning_phase(): 0
            })

        print('Found {} boxes for {}'.format(len(out_boxes), 'img'))

        font = ImageFont.truetype(font='font/FiraMono-Medium.otf',
                                  size=np.floor(3e-2 * image.size[1] + 0.5).astype('int32'))
        thickness = (image.size[0] + image.size[1]) // 300

        for i, c in reversed(list(enumerate(out_classes))):
            predicted_class = self.class_names[c]
            box = out_boxes[i]
            score = out_scores[i]

            label = '{} {:.2f}'.format(predicted_class, score)
            draw = ImageDraw.Draw(image)
            label_size = draw.textsize(label, font)

            top, left, bottom, right = box
            top = max(0, np.floor(top + 0.5).astype('int32'))
            left = max(0, np.floor(left + 0.5).astype('int32'))
            bottom = min(image.size[1], np.floor(bottom + 0.5).astype('int32'))
            right = min(image.size[0], np.floor(right + 0.5).astype('int32'))
            print(label, (left, top), (right, bottom))

            if top - label_size[1] >= 0:
                text_origin = np.array([left, top - label_size[1]])
            else:
                text_origin = np.array([left, top + 1])

            # My kingdom for a good redistributable image drawing library.
            for i in range(thickness):
                draw.rectangle(
                    [left + i, top + i, right - i, bottom - i],
                    outline=self.colors[c])
            draw.rectangle(
                [tuple(text_origin), tuple(text_origin + label_size)],
                fill=self.colors[c])
            draw.text(text_origin, label, fill=(0, 0, 0), font=font)
            del draw

        end = timer()
        print(end - start)
        return image

    def close_session(self):
        self.sess.close()


def detect_video(yolo, video_path, output_path=""):
    import cv2
    vid = cv2.VideoCapture(video_path)
    if not vid.isOpened():
        raise IOError("Couldn't open webcam or video")
    video_FourCC = int(vid.get(cv2.CAP_PROP_FOURCC))
    video_fps = vid.get(cv2.CAP_PROP_FPS)
    video_size = (int(vid.get(cv2.CAP_PROP_FRAME_WIDTH)),
                  int(vid.get(cv2.CAP_PROP_FRAME_HEIGHT)))
    isOutput = True if output_path != "" else False
    if isOutput:
        print("!!! TYPE:", type(output_path), type(video_FourCC), type(video_fps), type(video_size))
        out = cv2.VideoWriter(output_path, video_FourCC, video_fps, video_size)
    accum_time = 0
    curr_fps = 0
    fps = "FPS: ??"
    prev_time = timer()
    while True:
        return_value, frame = vid.read()
        if not return_value:  # stop cleanly when the stream ends
            break
        image = Image.fromarray(frame)
        image = yolo.detect_image(image)
        result = np.asarray(image)
        curr_time = timer()
        exec_time = curr_time - prev_time
        prev_time = curr_time
        accum_time = accum_time + exec_time
        curr_fps = curr_fps + 1
        if accum_time > 1:
            accum_time = accum_time - 1
            fps = "FPS: " + str(curr_fps)
            curr_fps = 0
        cv2.putText(result, text=fps, org=(3, 15), fontFace=cv2.FONT_HERSHEY_SIMPLEX,
                    fontScale=0.50, color=(255, 0, 0), thickness=2)
        cv2.namedWindow("result", cv2.WINDOW_NORMAL)
        cv2.imshow("result", result)
        if isOutput:
            out.write(result)
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
    yolo.close_session()
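A minimal way to run this detector on a saved clip, assuming hypothetical file names (input.mp4 and output.avi are placeholders, not paths from this repo):

if __name__ == '__main__':
    # YOLO() uses the _defaults paths unless overridden with keyword arguments.
    detect_video(YOLO(), 'input.mp4', output_path='output.avi')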
[net]
# Testing
#batch=1
#subdivisions=1
# Training
batch=64
subdivisions=8
width=416
height=416
channels=3
momentum=0.9
decay=0.0005
angle=0
saturation = 1.5
exposure = 1.5
hue=.1
learning_rate=0.001
burn_in=1000
max_batches = 500200
policy=steps
steps=400000,450000
scales=.1,.1
[convolutional]
batch_normalize=1
filters=16
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=2
[convolutional]
batch_normalize=1
filters=32
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=2
[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=2
[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=2
[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=2
[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky
[maxpool]
size=2
stride=1
[convolutional]
batch_normalize=1
filters=1024
size=3
stride=1
pad=1
activation=leaky
###########
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky
[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=leaky
[convolutional]
size=1
stride=1
pad=1
filters=18
activation=linear
[yolo]
mask = 3,4,5
anchors = 54,245, 53,266, 60,253, 58,271, 62,270, 66,258, 68,280, 73,266
classes=1
num=8
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1
[route]
layers = -4
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky
[upsample]
stride=2
[route]
layers = -1, 8
[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=leaky
[convolutional]
size=1
stride=1
pad=1
filters=18
activation=linear
[yolo]
mask = 0,1,2
anchors = 54,245, 53,266, 60,253, 58,271, 62,270, 66,258, 68,280, 73,266
classes=1
num=8
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1
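As a consistency check on this cfg (the standard darknet rule for YOLO heads, stated here as general knowledge rather than something documented in this repo): the filters value of the convolutional layer immediately before each [yolo] section must equal (classes + 5) * len(mask). A quick check in Python:

classes = 1
anchors_per_head = 3              # each [yolo] mask above lists three anchor indices
filters = (classes + 5) * anchors_per_head
print(filters)                    # 18, matching filters=18 before both [yolo] layers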