ML/DL Study Notes / Sample
[DL] - MediaPipe / Video Object Detection
KimTory
2022. 3. 6. 14:31
Development environment: Jupyter Notebook, Python 3.9, MediaPipe, OpenCV
■ Source Code
import cv2
import mediapipe as mp

# Handles for MediaPipe's face-detection solution and its drawing helpers,
# used below to run detection and render the results on each frame.
mp_face_detection = mp.solutions.face_detection
mp_drawing = mp.solutions.drawing_utils

# Source is a video file (not a webcam), so no horizontal flip is applied.
cap = cv2.VideoCapture("c:\\face_video.mp4")

# min_detection_confidence is in [0, 1]; higher values make detection
# stricter. 0.5 produced false detections, so it was raised to 0.7.
with mp_face_detection.FaceDetection(model_selection=0, min_detection_confidence=0.7) as face_detection:
    while cap.isOpened():
        success, image = cap.read()
        if not success:
            # End of the video file (or a read error) — stop processing.
            break

        # MediaPipe expects RGB input; marking the frame non-writeable lets
        # process() treat it as pass-by-reference.
        image.flags.writeable = False
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        results = face_detection.process(image)

        # Draw the face detection annotations on the image.
        image.flags.writeable = True
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

        if results.detections:
            # Each detection carries a score, a bounding box, and keypoints.
            for detection in results.detections:
                mp_drawing.draw_detection(image, detection)
                print(detection)  # dump score, box, keypoints, etc.

                # Keypoints are normalized [0, 1] coordinates relative to
                # the frame; indices 0/1/2 are right eye, left eye, nose tip.
                keypoints = detection.location_data.relative_keypoints
                right_eye = keypoints[0]
                left_eye = keypoints[1]
                nose_tip = keypoints[2]

                # Convert normalized coordinates to pixel positions (tuples).
                h, w, _ = image.shape
                right_eye = (int(right_eye.x * w), int(right_eye.y * h))
                left_eye = (int(left_eye.x * w), int(left_eye.y * h))
                nose_tip = (int(nose_tip.x * w), int(nose_tip.y * h))

                # Circle both eyes and the nose tip; colors are BGR.
                cv2.circle(image, right_eye, 50, (255, 0, 0), 10, cv2.LINE_AA)   # blue
                cv2.circle(image, left_eye, 50, (0, 255, 0), 10, cv2.LINE_AA)    # green
                cv2.circle(image, nose_tip, 50, (0, 255, 255), 10, cv2.LINE_AA)  # yellow

        # Show the frame at half the original size.
        cv2.imshow('MediaPipe Face Detection', cv2.resize(image, None, fx=0.5, fy=0.5))
        # Mask to the low byte: waitKey() can carry modifier/high bits on
        # some platforms, which would make the bare comparison fail.
        if cv2.waitKey(1) & 0xFF == ord('q'):  # quit on "q"
            break

cap.release()  # release the video capture resources
cv2.destroyAllWindows()
■ Output / left and right eyes and nose distinguished
→ After face detection, the eyes and nose tip are marked with colored circles so they can be told apart.