Merge branch 'master' of http://khuhub.khu.ac.kr/2021-1-capstone-design2/2017103972

김성연
Commit fea4c30aac49316c70ab6747b9dbe915a69dfe53 fea4c30a 2 parents 2023e7ac d0007ba8
Showing 5 changed files with 317 additions and 1 deletions
code/simple_face_recognition
code/videoTest/matrix_face_recognition.ipynb
code/videoTest/video.py
code/videoTest/video2.py
code/videoTest/video3.py
--- a/simple_face_recognition @ 0066cd85
+++ b/simple_face_recognition @ 0066cd85
- Subproject commit 0066cd8581e59918a924357d3371b1e1298cd0e5
--- a/code/videoTest/matrix_face_recognition.ipynb 0 → 100644
View file @fea4c30
+++ b/code/videoTest/matrix_face_recognition.ipynb 0 → 100644
View file @fea4c30
--- a/code/videoTest/video.py 0 → 100644
View file @fea4c30
+++ b/code/videoTest/video.py 0 → 100644
View file @fea4c30
+ import dlib, cv2
+ import numpy as np
+ 
+ detector = dlib.get_frontal_face_detector()
+ sp = dlib.shape_predictor('models/shape_predictor_68_face_landmarks.dat')
+ facerec = dlib.face_recognition_model_v1('models/dlib_face_recognition_resnet_model_v1.dat')
+ 
+ descs = np.load('img/descs.npy', allow_pickle=True)[()]
+ 
+ def encode_face(img):
+   dets = detector(img, 1)
+ 
+   if len(dets) == 0:
+     return np.empty(0)
+ 
+   for k, d in enumerate(dets):
+     shape = sp(img, d)
+     face_descriptor = facerec.compute_face_descriptor(img, shape)
+ 
+     return np.array(face_descriptor)
+ 
+ video_path = './data/record0.mp4'
+ cap = cv2.VideoCapture(video_path)
+ 
+ if not cap.isOpened():
+   exit()
+ 
+ _, img_bgr = cap.read() # (800, 1920, 3)
+ padding_size = 0
+ resized_width = 1920
+ video_size = (resized_width, int(img_bgr.shape[0] * resized_width // img_bgr.shape[1]))
+ output_size = (resized_width, int(img_bgr.shape[0] * resized_width // img_bgr.shape[1] + padding_size * 2))
+ 
+ fourcc = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
+ writer = cv2.VideoWriter('%s_output.mp4' % (video_path.split('.')[0]), fourcc, cap.get(cv2.CAP_PROP_FPS), output_size)
+ 
+ while True:
+   ret, img_bgr = cap.read()
+   if not ret:
+     break
+ 
+   img_bgr = cv2.resize(img_bgr, video_size)
+   img_rgb = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)
+ 
+   # img_bgr = cv2.copyMakeBorder(img_bgr, top=padding_size, bottom=padding_size, left=0, right=0, borderType=cv2.BORDER_CONSTANT, value=(0,0,0))
+   
+   dets = detector(img_bgr, 1)
+ 
+   for k, d in enumerate(dets):
+     shape = sp(img_rgb, d)
+     face_descriptor = facerec.compute_face_descriptor(img_rgb, shape)
+ 
+     last_found = {'name': 'unknown', 'dist': 0.6, 'color': (0,0,255)}
+ 
+     for name, saved_desc in descs.items():
+       dist = np.linalg.norm([face_descriptor] - saved_desc, axis=1)
+ 
+       if dist < last_found['dist']:
+         last_found = {'name': name, 'dist': dist, 'color': (255,255,255)}
+ 
+     cv2.rectangle(img_bgr, pt1=(d.left(), d.top()), pt2=(d.right(), d.bottom()), color=last_found['color'], thickness=2)
+     cv2.putText(img_bgr, last_found['name'], org=(d.left(), d.top()), fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=1, color=last_found['color'], thickness=2)
+ 
+   writer.write(img_bgr)
+ 
+   cv2.imshow('img', img_bgr)
+   
+   if cv2.waitKey(1) == ord('q'):
+     break
+ 
+ cap.release()
+ writer.release()
--- a/code/videoTest/video2.py 0 → 100644
View file @fea4c30
+++ b/code/videoTest/video2.py 0 → 100644
View file @fea4c30
+ import dlib
+ import cv2
+ import numpy as np
+ import matplotlib.pyplot as plt
+ import tensorflow as tf
+ import math
+ import os
+ import pathlib
+ import time
+ import pandas as pd
+ import tensorflow as tf
+ from tensorflow.keras.preprocessing.image import ImageDataGenerator,load_img
+ from tensorflow.keras.models import load_model
+ from tensorflow.keras import regularizers
+ from tensorflow import keras
+ from imutils import face_utils
+ import time
+ 
+  
+ start = time.time()
+ detector = dlib.get_frontal_face_detector()
+ predictor = dlib.shape_predictor("./models/shape_predictor_68_face_landmarks.dat")
+ facerec = dlib.face_recognition_model_v1('models/dlib_face_recognition_resnet_model_v1.dat')
+ model = load_model('../checkpoint/er-best-mobilenet1-bt32-model-classweight-adam.h5')
+ # model = load_model('../checkpoint/er-best-mobilenet2-bt32-model-adam.h5')
+ # model = load_model('../checkpoint/er-best-efficientNet1-bt32-model-SGD.h5')
+     
+     
+ descs = np.load('img/descs2.npy', allow_pickle=True)[()]
+  
+ video_path = './data/zoom_1.mp4'
+ cap=cv2.VideoCapture(video_path)
+  
+ 
+ 
+ labels_dict_ = {0 : 'angry', 1 : 'fear' ,  2: 'happy', 3: 'neutral', 4:  'sad', 5: 'surprise'}
+ # labels_dict_ = {'angry' : 0,'fear' : 1 ,'happy' : 2, 'neutral' : 3,  'sad' : 4, 'surprise' : 5}
+ time_dict = {'angry': [], 'fear': [], 'happy': [], 'neutral': [], 'sad': [], 'surprise': []}
+ def get_key(val):
+     for key, value in labels_dict_.items():
+         if(value == val):
+             return key
+ 
+ 
+ def convertMillis(millis):
+     seconds=(millis/1000)%60 
+     minutes=(millis/(1000*60))%60
+     hours=(millis/(1000*60*60))%24
+     return seconds, int(minutes), int(hours)
+ 
+ #cap = cv2.VideoCapture(0) # 0번 카메라
+  
+ # 동영상 크기(frame정보)를 읽어옴
+ frameWidth = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+ frameHeight = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+ frame_size = (frameWidth, frameHeight)
+ fps = cap.get((cv2.CAP_PROP_FPS))
+ 
+ 
+ _, img_bgr = cap.read() # (800, 1920, 3)
+ padding_size = 0
+ resized_width = 1920
+ video_size = (resized_width, int(img_bgr.shape[0] * resized_width // img_bgr.shape[1]))
+ timestamps = [cap.get(cv2.CAP_PROP_POS_MSEC)]
+ prev_time = 0
+ 
+ fourcc = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
+ # out1 = cv2.VideoWriter('./data/record0.mp4',fourcc, fps, frame_size)
+ 
+ while True:
+     retval, frameBGR = cap.read()	# 영상을 한 frame씩 읽어오기
+     current_time = time.time() - prev_time
+ 
+     if(type(frameBGR) == type(None)):
+         pass
+     else:
+         frameBGR = cv2.resize(frameBGR, video_size)
+         frame = cv2.cvtColor(frameBGR, cv2.COLOR_BGR2RGB)
+         
+         if (retval is True) and (current_time > 1.5) :
+             prev_time = time.time()
+             faces = detector(frame, 1)
+             
+             for (i, face) in enumerate(faces):
+                 shape = predictor(frame, face)
+                 face_descriptor = facerec.compute_face_descriptor(frame, shape)
+                 
+                 img = cv2.resize(frame[face.top():face.bottom(), face.left():face.right()], dsize=(224, 224), interpolation = cv2.INTER_CUBIC)
+                 imgarr = np.array(img).reshape(1, 224, 224, 3) /255
+                 emotion = labels_dict_[model.predict(imgarr).argmax(axis=-1)[0]]
+                 # emotion = get_key(model.predict_classes(imgarr))
+ 
+                 
+                 last_found = {'name': 'unknown', 'dist': 0.6, 'color': (0,0,255)}
+                 
+                 for name, saved_desc in descs.items():
+                     dist = np.linalg.norm([face_descriptor] - saved_desc, axis=1)
+                     if dist < last_found['dist']:
+                         last_found = {'name': name, 'dist': dist, 'color': (255,255,255)}
+                 
+                 cv2.rectangle(frameBGR, pt1=(face.left(), face.top()), pt2=(face.right(), face.bottom()), color=last_found['color'], thickness=2)
+                 cv2.putText(frameBGR, last_found['name'] + ',' + emotion , org=(face.left(), face.top()), fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=1, color=last_found['color'], thickness=2)
+                 # cv2.putText(frameBGR, last_found['name'] + ',' , org=(face.left(), face.top()), fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=1, color=last_found['color'], thickness=2)
+             
+                 con_sec, con_min, con_hour = convertMillis(cap.get(cv2.CAP_PROP_POS_MSEC))
+                 time_dict[emotion].append("{0}:{1}:{2}".format(con_hour, con_min, round(con_sec, 3)))
+                 print("{0}:{1}:{2} {3}".format(con_hour, con_min, round(con_sec, 3), emotion))
+                 # print("{0}:{1}:{2} {3}".format(con_hour, con_min, con_sec))
+ 
+         cv2.imshow('frame', frameBGR)
+ 
+     key = cv2.waitKey(25)
+     if key == 27 :
+         break
+ 
+ print(time_dict)       
+ print("총 시간 : ", time.time() - start)
+ if cap.isOpened():
+     cap.release()
+ 
+ for i in range(1,5):
+     cv2.destroyAllWindows()
+     cv2.waitKey(1)
--- a/code/videoTest/video3.py 0 → 100644
View file @fea4c30
+++ b/code/videoTest/video3.py 0 → 100644
View file @fea4c30
+ import dlib
+ import cv2
+ import numpy as np
+ import matplotlib.pyplot as plt
+ import tensorflow as tf
+ import math
+ import os
+ import pathlib
+ import time
+ import pandas as pd
+ import tensorflow as tf
+ from tensorflow.keras.preprocessing.image import ImageDataGenerator,load_img
+ from tensorflow.keras.models import load_model
+ from tensorflow.keras import regularizers
+ from tensorflow import keras
+ from imutils import face_utils
+ import time
+ 
+  
+ start = time.time()
+ detector = dlib.get_frontal_face_detector()
+ predictor = dlib.shape_predictor("./models/shape_predictor_68_face_landmarks.dat")
+ facerec = dlib.face_recognition_model_v1('models/dlib_face_recognition_resnet_model_v1.dat')
+ # model = load_model('../checkpoint/er-best-mobilenet1-bt32-model-adam.h5')
+ model = load_model('../checkpoint/er-best-efficientNet1-bt32-model-SGD.h5')
+     
+     
+ descs = np.load('img/descs2.npy', allow_pickle=True)[()]
+  
+ video_path = './data/zoom_1.mp4'
+ cap=cv2.VideoCapture(video_path)
+  
+ 
+ 
+ # labels_dict_ = {0 : 'angry', 1 : 'fear' ,  2: 'happy', 3: 'neutral', 4:  'sad', 5: 'surprise'}
+ labels_dict_ = {'angry' : 0,'fear' : 1 ,'happy' : 2, 'neutral' : 3,  'sad' : 4, 'surprise' : 5}
+ time_dict = {'angry': [], 'fear': [], 'happy': [], 'neutral': [], 'sad': [], 'surprise': []}
+ def get_key(val):
+     for key, value in labels_dict_.items():
+         if(value == val):
+             return key
+ 
+ 
+ def convertMillis(millis):
+     seconds=(millis/1000)%60 
+     minutes=(millis/(1000*60))%60
+     hours=(millis/(1000*60*60))%24
+     return seconds, int(minutes), int(hours)
+ 
+ #cap = cv2.VideoCapture(0) # 0번 카메라
+  
+ # 동영상 크기(frame정보)를 읽어옴
+ frameWidth = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+ frameHeight = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+ frame_size = (frameWidth, frameHeight)
+ fps = cap.get((cv2.CAP_PROP_FPS))
+ 
+ 
+ _, img_bgr = cap.read() # (800, 1920, 3)
+ padding_size = 0
+ resized_width = 1920
+ video_size = (resized_width, int(img_bgr.shape[0] * resized_width // img_bgr.shape[1]))
+ timestamps = [cap.get(cv2.CAP_PROP_POS_MSEC)]
+ prev_time = 0
+ 
+ fourcc = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
+ # out1 = cv2.VideoWriter('./data/record0.mp4',fourcc, fps, frame_size)
+ 
+ while True:
+     retval, frameBGR = cap.read()	# 영상을 한 frame씩 읽어오기
+     current_time = time.time() - prev_time
+ 
+     if(type(frameBGR) == type(None)):
+         pass
+     else:
+         frameBGR = cv2.resize(frameBGR, video_size)
+         frame = cv2.cvtColor(frameBGR, cv2.COLOR_BGR2RGB)
+         
+         if (retval is True) and (current_time > 1.5) :
+             prev_time = time.time()
+             faces = detector(frame, 1)
+             
+             for (i, face) in enumerate(faces):
+                 shape = predictor(frame, face)
+                 face_descriptor = facerec.compute_face_descriptor(frame, shape)
+                 
+                 img = cv2.resize(frame[face.top():face.bottom(), face.left():face.right()], dsize=(224, 224), interpolation = cv2.INTER_CUBIC)
+                 imgarr = np.array(img).reshape(1, 224, 224, 3) /255
+                 # emotion = labels_dict_[model.predict(imgarr).argmax(axis=-1)[0]]
+                 emotion = get_key(model.predict_classes(imgarr))
+ 
+                 
+                 last_found = {'name': 'unknown', 'dist': 0.6, 'color': (0,0,255)}
+                 
+                 for name, saved_desc in descs.items():
+                     dist = np.linalg.norm([face_descriptor] - saved_desc, axis=1)
+                     if dist < last_found['dist']:
+                         last_found = {'name': name, 'dist': dist, 'color': (255,255,255)}
+                 
+                 cv2.rectangle(frameBGR, pt1=(face.left(), face.top()), pt2=(face.right(), face.bottom()), color=last_found['color'], thickness=2)
+                 cv2.putText(frameBGR, last_found['name'] + ',' + emotion , org=(face.left(), face.top()), fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=1, color=last_found['color'], thickness=2)
+                 # cv2.putText(frameBGR, last_found['name'] + ',' , org=(face.left(), face.top()), fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=1, color=last_found['color'], thickness=2)
+             
+                 con_sec, con_min, con_hour = convertMillis(cap.get(cv2.CAP_PROP_POS_MSEC))
+                 time_dict[emotion].append("{0}:{1}:{2}".format(con_hour, con_min, round(con_sec, 3)))
+                 print("{0}:{1}:{2} {3}".format(con_hour, con_min, round(con_sec, 3), emotion))
+                 # print("{0}:{1}:{2} {3}".format(con_hour, con_min, con_sec))
+ 
+         cv2.imshow('frame', frameBGR)
+ 
+     key = cv2.waitKey(25)
+     if key == 27 :
+         break
+ 
+ print(time_dict)       
+ print("총 시간 : ", time.time() - start)
+ if cap.isOpened():
+     cap.release()
+ 
+ for i in range(1,5):
+     cv2.destroyAllWindows()
+     cv2.waitKey(1)