age-gender-emotion.py

import cv2
import os
from time import sleep
import numpy as np
import argparse
from wide_resnet import WideResNet
from keras.utils.data_utils import get_file
from keras.models import load_model


class FaceCV(object):

    CASE_PATH = "haarcascade_frontalface_alt.xml"

    
    def __new__(cls, weight_file=None, depth=16, width=8, face_size=64):
        if not hasattr(cls, 'instance'):
            cls.instance = super(FaceCV, cls).__new__(cls)
        return cls.instance

    def __init__(self, depth=16, width=8, face_size=64):
        self.face_size = face_size
        self.model_ag = WideResNet(face_size, depth=depth, k=width)()
        self.model_emo = load_model('models/fer2013.hdf5')
        self.mapper = {0: "Angry", 1: "Disgust", 2: "Fear", 3: "Happy", 4: "Sad", 5: "Surprise", 6: "Neutral"}
        self.model_ag.load_weights('models/age-gender.hdf5')

    @classmethod
    def draw_label(cls, image, point, label, font=cv2.FONT_HERSHEY_SIMPLEX,
                   font_scale=1, thickness=2):
        size = cv2.getTextSize(label, font, font_scale, thickness)[0]
        x, y = point
        cv2.rectangle(
            image, (x, y - size[1]), (x + size[0], y), (255, 0, 0), cv2.FILLED)
        cv2.putText(image, label, point, font, font_scale,
                    (255, 255, 255), thickness)

    
    def detect_face(self):

        face_cascade = cv2.CascadeClassifier(
            cv2.data.haarcascades + self.CASE_PATH)
        face_cascade.empty()

        video_capture = cv2.VideoCapture(0)
        #  break by key ESC
        while True:
            if not video_capture.isOpened():
                sleep(5)
            ret, frame = video_capture.read()
            gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
            faces = face_cascade.detectMultiScale(
                gray,
                scaleFactor=1.2,
                minNeighbors=10,
                minSize=(self.face_size, self.face_size)
            )
            if faces is not ():

                face_imgs = np.empty(
                    (len(faces), self.face_size, self.face_size, 3))
                for i, face in enumerate(faces):
                    face_img,em_img, cropped = self.crop_face(
                        frame, face, margin=40, size=self.face_size)
                    (x, y, w, h) = cropped
                    cv2.rectangle(frame, (x, y), (x + w, y + h),
                                  (255, 200, 0), 2)
                    face_imgs[i, :, :, :] = face_img

                if len(face_imgs) > 0:
                    # predict ages and genders of the detected faces

                    results = self.model_ag.predict(face_imgs)
                    

                    em_img = em_img.astype('float32')
                    em_img = em_img/255.
                    em_img = np.expand_dims(em_img, 0)
                    em_img = np.expand_dims(em_img, -1)

                    
                    emotion = self.mapper[np.argmax(self.model_emo.predict(em_img))]
                    predicted_genders = results[0]
                    ages = np.arange(0, 101).reshape(101, 1)
                    predicted_ages = results[1].dot(ages).flatten()

                # draw results
                for i, face in enumerate(faces):
                    label = "{}, {}, {}".format(int(predicted_ages[i]),
                                            "F" if predicted_genders[i][0] > 0.5 else "M",emotion)

                    self.draw_label(frame, (face[0], face[1]), label)
            else:
                pass

            cv2.imshow('Keras Faces', frame)
            if cv2.waitKey(5) == 27:  # ESC key press
                break
        # When everything is done, release the capture
        video_capture.release()
        cv2.destroyAllWindows()

    def crop_face(self, imgarray, section, margin=40, size=64):
       
        img_h, img_w, _ = imgarray.shape
        if section is None:
            section = [0, 0, img_w, img_h]
        (x, y, w, h) = section
        margin = int(min(w, h) * margin / 100)
        x_a = x - margin
        y_a = y - margin
        x_b = x + w + margin
        y_b = y + h + margin
        if x_a < 0:
            x_b = min(x_b - x_a, img_w-1)
            x_a = 0
        if y_a < 0:
            y_b = min(y_b - y_a, img_h-1)
            y_a = 0
        if x_b > img_w:
            x_a = max(x_a - (x_b - img_w), 0)
            x_b = img_w
        if y_b > img_h:
            y_a = max(y_a - (y_b - img_h), 0)
            y_b = img_h
        cropped = imgarray[y_a: y_b, x_a: x_b]
        resized_img = cv2.resize(
            cropped, (size, size), interpolation=cv2.INTER_AREA)
        resized_img = np.array(resized_img)
        
        
        gray = cv2.cvtColor(cropped, cv2.COLOR_BGR2GRAY)
        resized_img2 = cv2.resize(
            gray, (64,64), interpolation=cv2.INTER_AREA)
        resized_img2 = np.array(resized_img2)
        return resized_img,resized_img2, (x_a, y_a, x_b - x_a, y_b - y_a)


def main():

    
    face = FaceCV()

    face.detect_face()


if __name__ == "__main__":
    main()