src/driver.py

from argparse import ArgumentParser

import logging
from input_feeder import InputFeeder
import constants
import os
from face_detection import Face_Model
from facial_landmarks_detection import Landmark_Model
from gaze_estimation import Gaze_Estimation_Model
from head_pose_estimation import Head_Pose_Model
from mouse_controller import MouseController
import cv2
import imutils
import math
# import line_profiler
# profile=line_profiler.LineProfiler()
# import atexit
# atexit.register(profile.print_stats)


def imshow(windowname, frame, width=None):
    if width == None:
        width = 400

    frame = imutils.resize(frame, width=width)
    cv2.imshow(windowname, frame)


def build_argparser():
    parser = ArgumentParser()
    parser.add_argument("-f", "--face", required=True, type=str,
                        help="Path to .xml file of Face Detection model.")
    parser.add_argument("-l", "--landmarks", required=True, type=str,
                        help="Path to .xml file of Facial Landmark Detection model.")
    parser.add_argument("-hp", "--headpose", required=True, type=str,
                        help="Path to .xml file of Head Pose Estimation model.")
    parser.add_argument("-ge", "--gazeestimation", required=True, type=str,
                        help="Path to .xml file of Gaze Estimation model.")
    parser.add_argument("-i", "--input", required=True, type=str,
                        help="Path to video file or enter cam for webcam")
    parser.add_argument("-it", "--input_type", required=True, type=str,
                        help="Provide the source of video frames." + constants.VIDEO + " " + constants.WEBCAM + " | " + constants.IP_CAMERA + " | " + constants.IMAGE)
    parser.add_argument("-debug", "--debug", required=False, type=str, nargs='+',
                        default=[],
                        help="To debug each model's output visually, type the model name with comma seperated after --debug")
    parser.add_argument("-ld", "--cpu_extension", required=False, type=str,
                        default=None,
                        help="linker libraries if have any")
    parser.add_argument("-d", "--device", type=str, default="CPU",
                        help="Provide the target device: "
                             "CPU, GPU, FPGA or MYRIAD is acceptable.")

    return parser

# @profile
def main(args):
    logger = logging.getLogger()

    feeder = None
    if args.input_type == constants.VIDEO or args.input_type == constants.IMAGE:
        extension = str(args.input).split('.')[1]
        # if not extension.lower() in constants.ALLOWED_EXTENSIONS:
        #     logger.error('Please provide supported extension.' + str(constants.ALLOWED_EXTENSIONS))
        #     exit(1)

        # if not os.path.isfile(args.input):
        #     logger.error("Unable to find specified video/image file")
        #     exit(1)

        feeder = InputFeeder(args.input_type, args.input)
    elif args.input_type == constants.IP_CAMERA:
        if not str(args.input).startswith('http://'):
            logger.error('Please provide ip of server with http://')
            exit(1)

        feeder = InputFeeder(args.input_type, args.input)
    elif args.input_type == constants.WEBCAM:
        feeder = InputFeeder(args.input_type)

    mc = MouseController("medium", "fast")

    feeder.load_data()

    face_model = Face_Model(args.face, args.device, args.cpu_extension)
    face_model.check_model()

    landmark_model = Landmark_Model(args.landmarks, args.device, args.cpu_extension)
    landmark_model.check_model()

    # gaze_model = Gaze_Estimation_Model(args.gazeestimation, args.device, args.cpu_extension)
    # gaze_model.check_model()

    head_model = Head_Pose_Model(args.headpose, args.device, args.cpu_extension)
    head_model.check_model()

    face_model.load_model()
    logger.info("Face Detection Model Loaded...")
    landmark_model.load_model()
    logger.info("Landmark Detection Model Loaded...")
    # gaze_model.load_model()
    # logger.info("Gaze Estimation Model Loaded...")
    head_model.load_model()
    logger.info("Head Pose Detection Model Loaded...")
    print('Loaded')

    try:
        frame_count = 0
        for ret, frame in feeder.next_batch():
            if not ret:
                break

            if frame is None:
                continue

            frame_count += 1
            crop_face = None
            if True:

                crop_face, box = face_model.predict(frame.copy())


                if crop_face is None:
                    logger.error("Unable to detect the face.")
                    continue
                imshow('frame', crop_face, width=400)

                (lefteye_x, lefteye_y), (
                    righteye_x, righteye_y), eye_coords, left_eye, right_eye = landmark_model.predict(
                    crop_face.copy(), eye_surrounding_area=15)

                # imshow("left_eye", left_eye, width=100)
                # imshow("right_eye", right_eye, width=100)
                '''TODO dlib is better to crop eye with perfection'''

                head_position = head_model.predict(crop_face.copy())

                if True:
                    if cv2.waitKey(20) & 0xFF == ord('q'):
                        break
                    continue


                gaze, (mousex, mousey) = gaze_model.predict(left_eye.copy(), right_eye.copy(), head_position)

                if (len(args.debug) > 0):
                    debuFrame = frame.copy()
                    if crop_face is None:
                        continue

                    thickness = 2
                    radius = 2
                    color = (0, 0, 255)
                    [[le_xmin, le_ymin, le_xmax, le_ymax], [re_xmin, re_ymin, re_xmax, re_ymax]] = eye_coords

                    if 'face' in args.debug:
                            cv2.rectangle(debuFrame, (box[0], box[1]), (box[2], box[3]), (255, 255, 255), 2)


                            cv2.rectangle(crop_face, (re_xmin, re_ymin), (re_xmax, re_ymax), (100, 255, 100), 2)
                            cv2.rectangle(crop_face, (le_xmin, le_ymin), (le_xmax, le_ymax), (100, 255, 100), 2)

                    '''
                    LandMark
                    '''

                    cv2.circle(crop_face, (lefteye_x, lefteye_y), radius, color, thickness)
                    cv2.circle(crop_face, (righteye_x, righteye_y), radius, color, thickness)

                    debuFrame[box[1]:box[3], box[0]:box[2]] = crop_face


                    if 'headpose' in args.debug:
                        yaw = head_position[0]
                        pitch = head_position[1]
                        roll = head_position[2]

                        sinY = math.sin(yaw * math.pi / 180.0)
                        sinP = math.sin(pitch * math.pi / 180.0)
                        sinR = math.sin(roll * math.pi / 180.0)

                        cosY = math.cos(yaw * math.pi / 180.0)
                        cosP = math.cos(pitch * math.pi / 180.0)
                        cosR = math.cos(roll * math.pi / 180.0)

                        cH, cW = crop_face.shape[:2]
                        arrowLength = 0.4 * cH * cW

                        xCenter = int(cW / 2)
                        yCenter = int(cH / 2)

                        # center to right
                        # cv2.line(crop_face, (xCenter, yCenter),
                        #          (int((xCenter + arrowLength * (cosR * cosY + sinY * sinP * sinR))),
                        #           int((yCenter + arrowLength * cosP * sinR))), (186, 204, 2), 1)
            #
            #             # center to top
            #             cv2.line(crop_face, (xCenter, yCenter),
            #                      (int(((xCenter + arrowLength * (cosR * sinY * sinP + cosY * sinR)))),
            #                       int((yCenter - arrowLength * cosP * cosR))), (186, 204, 2), 1)
            #
            #             # center to forward
            #             cv2.line(crop_face, (xCenter, yCenter),
            #                      (int(((xCenter + arrowLength * sinY * cosP))),
            #                       int((yCenter + arrowLength * sinP))), (186, 204, 2), 1)
            #
                        cv2.putText(crop_face, 'head pose: (y={:.2f}, p={:.2f}, r={:.2f})'.format(yaw, pitch, roll),
                                    (0, 20), cv2.FONT_HERSHEY_SIMPLEX,
                                    0.35, (255, 255, 255), 1)


                    if 'gaze' in args.debug:
                        cH, cW = crop_face.shape[:2]
                        arrowLength = 0.6 * cH

                        gazeArrowX = gaze[0] * arrowLength
                        gazeArrowY = -gaze[1] * arrowLength

                        debuFrame[box[1]:box[3], box[0]:box[2]] = crop_face

                        cv2.arrowedLine(crop_face, (lefteye_x, lefteye_y),
                                        (int(lefteye_x + gazeArrowX), int(lefteye_y + gazeArrowY)), (184, 113, 57), 2)
                        cv2.arrowedLine(crop_face, (righteye_x, righteye_y),
                                        (int(righteye_x + gazeArrowX), int(righteye_y + gazeArrowY)), (184, 113, 57), 2)

                        cv2.putText(crop_face, 'gaze angles: h={}, v={}'.format("!", "2"), (0, 10),
                                    cv2.FONT_HERSHEY_SIMPLEX,
                                    0.35, (255, 255, 255), 1)

                        debuFrame[box[1]:box[3], box[0]:box[2]] = crop_face

            #
            #             imshow("face", crop_face, width=400)
            #             cv2.moveWindow("face", 0, 0)
            #             imshow("debug", debuFrame, width=400)
            #             cv2.moveWindow("debug", cW * 2, cH)

                # try:
                #     if frame_count % 5 == 0:
                #         mc.move(mousex, mousey)
                # except Exception as err:
                #     logger.error("Moving cursor outside the PC not supported yet !!")

            # key = cv2.waitKey(60)
                    imshow('frame', debuFrame, width=1210)

            if cv2.waitKey(20) & 0xFF == ord('q'):
                break
    except Exception as err:
        logger.error(err)

    cv2.destroyAllWindows()
    feeder.close()


if __name__ == '__main__':
    arg = '-f ../models/intel/face-detection-adas-0001/FP16/face-detection-adas-0001.xml -l ../models/intel/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.xml -hp ../models/intel/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.xml -ge ../models/intel/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.xml -i ../bin/demo.mp4 -it video -d CPU -debug headpose gaze face'.split(' ')
    # args = build_argparser().parse_args(arg)
    args = build_argparser().parse_args()

    main(args)