rudy_main.py

import tkinter as tk
import cv2
from PIL import Image, ImageTk
import numpy as np
from tkinter.filedialog import askopenfilename
import shutil
import time
import os
from matplotlib import pyplot
from numpy import asarray
from scipy.spatial.distance import cosine
from mtcnn.mtcnn import MTCNN
from keras_vggface.vggface import VGGFace
from keras_vggface.utils import preprocess_input
import argparse
from wide_resnet import WideResNet
from keras.utils.data_utils import get_file

global fileName1,fileName2

class FaceCV(object):

    CASE_PATH = "pretrained_models\\haarcascade_frontalface_alt.xml"
    WRN_WEIGHTS_PATH = "pretrained_models\\weights.18-4.06.hdf5"

    def __new__(cls, weight_file=None, depth=16, width=8, face_size=64):
        if not hasattr(cls, 'instance'):
            cls.instance = super(FaceCV, cls).__new__(cls)
        return cls.instance

    def __init__(self, depth=16, width=8, face_size=64):
        self.face_size = face_size
        self.model = WideResNet(face_size, depth=depth, k=width)()
        model_dir = os.path.join(os.getcwd(), "pretrained_models").replace("//", "\\")
        fpath = get_file('weights.18-4.06.hdf5', self.WRN_WEIGHTS_PATH, cache_subdir=model_dir)
        self.model.load_weights(fpath)

    def crop_face(self, imgarray, section, margin=40, size=64):
        img_h, img_w, _ = imgarray.shape
        if section is None:
            section = [0, 0, img_w, img_h]
        (x, y, w, h) = section
        margin = int(min(w,h) * margin / 100)
        x_a = x - margin
        y_a = y - margin
        x_b = x + w + margin
        y_b = y + h + margin
        if x_a < 0:
            x_b = min(x_b - x_a, img_w-1)
            x_a = 0
        if y_a < 0:
            y_b = min(y_b - y_a, img_h-1)
            y_a = 0
        if x_b > img_w:
            x_a = max(x_a - (x_b - img_w), 0)
            x_b = img_w
        if y_b > img_h:
            y_a = max(y_a - (y_b - img_h), 0)
            y_b = img_h
        cropped = imgarray[y_a: y_b, x_a: x_b]
        resized_img = cv2.resize(cropped, (size, size), interpolation=cv2.INTER_AREA)
        resized_img = np.array(resized_img)
        return resized_img, (x_a, y_a, x_b - x_a, y_b - y_a)

    def detect_face_image(self, filename):                  
        result_age=0
        result_gender='M'
        face_cascade = cv2.CascadeClassifier(self.CASE_PATH)
        frame = cv2.imread(filename)
        gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
        faces = face_cascade.detectMultiScale(
            gray,
            scaleFactor=1.2,
            minNeighbors=10,
            minSize=(self.face_size, self.face_size)
        )
        if True:
            face_imgs = np.empty((len(faces), self.face_size, self.face_size, 3))
            for i, face in enumerate(faces):
                face_img, cropped = self.crop_face(frame, face, margin=40, size=self.face_size)
                (x, y, w, h) = cropped
                cv2.rectangle(frame, (x, y), (x + w, y + h), (255, 200, 0), 2)
                face_imgs[i,:,:,:] = face_img
            
            if len(face_imgs) > 0:
                # predict ages and genders of the detected faces
                results = self.model.predict(face_imgs)
                predicted_genders = results[0]
                ages = np.arange(0, 101).reshape(101, 1)
                predicted_ages = results[1].dot(ages).flatten()
                print(predicted_genders)
                
            # draw results
            for i, face in enumerate(faces):
                result_gender = "F" if predicted_genders[i][0] > 0.5 else "M"
                result_age = int(predicted_ages[i])
                print(int(predicted_ages[i]),predicted_genders[i][0])
        else:
            print('No faces')
        return result_age, result_gender


def get_args():
    parser = argparse.ArgumentParser(formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument("--depth", type=int, default=16, help="depth of network")
    parser.add_argument("--width", type=int, default=8, help="width of network")
    args = parser.parse_args()
    return args


class App:
    def __init__(self, window, window_title, video_source):
        self.window = window
        self.window.title(window_title)
        
        # Open the video source
        self.cap = cv2.VideoCapture(video_source)
        self.cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640)
        self.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480)
        
        # Create a canvas that can fit the video source
        self.canvas = tk.Canvas(window, width = self.cap.get(cv2.CAP_PROP_FRAME_WIDTH), height = self.cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        self.canvas.pack()
        
        # Use PIL (Pillow) to convert the OpenCV image to a Tkinter image
        self.photo = None
        self.update()
        
        dirPath = "testpicture"
        fileList = os.listdir(dirPath)
        for fileName in fileList:
            os.remove(dirPath + "/" + fileName)


        def openphoto():
            global fileName1
            fileName1 = askopenfilename(title='Select image for analysis ', filetypes=[('image files', '.jpg')])
            dst = "testpicture"
            print(fileName1)
            print (os.path.split(fileName1)[-1])
            shutil.copy(fileName1, dst)
            load1 = Image.open(fileName1)
            im1=load1.resize((300,300), Image.ANTIALIAS)
            render = ImageTk.PhotoImage(im1)
            img = tk.Label(image=render, height="300", width="300")
            img.image = render
            img.place(x=500, y=75)

        def openphoto2():
            global fileName2
            fileName2 = askopenfilename(initialdir='', title='Select image for analysis ',filetypes=[('image files', '.jpg')])
            dst = "testpicture"
            print(fileName2)
            print (os.path.split(fileName2)[-1])
            shutil.copy(fileName2, dst)
            load2 = Image.open(fileName2)
            im2=load2.resize((300,300), Image.ANTIALIAS)
            render = ImageTk.PhotoImage(im2)
            img1 = tk.Label(image=render, height="300", width="300")
            img1.image = render
            img1.place(x=500, y=425)

        detector = MTCNN()
        model = VGGFace(model='resnet50', include_top=False, input_shape=(224, 224, 3), pooling='avg')

        def extract_face_live(filename,detector=detector,required_size=(224, 224)):
            pixels = pyplot.imread(filename)
            # detect faces in the image
            results = detector.detect_faces(pixels)
            # extract the bounding box from the first face
            x1, y1, width, height = results[0]['box']
            x2, y2 = x1 + width, y1 + height
            # extract the face
            face = pixels[y1:y2, x1:x2]
            image = Image.fromarray(face)
            image = image.resize(required_size)
            face_array = asarray(image)
            return face_array
        
        def get_embeddings_live(face, model=model):
            samples = asarray(face, 'float32')
            samples = preprocess_input(samples, version=2)
            samples = samples[np.newaxis,:]
            yhat = model.predict(samples)
            return yhat
        
        def open_camera():
            flag=False
            start_time = time.time()
            video_capture = cv2.VideoCapture(0)
            ID_face = extract_face_live(fileName1,detector)
            ID_embedding=get_embeddings_live(ID_face,model)
            while True:
                _, frame = video_capture.read()
                try:
                    result = detector.detect_faces(frame)
                    if result != []:
                        for _ in result:
                            x1, y1, width, height = result[0]['box']
                            x2, y2 = x1 + width, y1 + height
                            # extract the face
                            face = frame[y1:y2, x1:x2]
                            # resize pixels to the model size
                            subject_face = Image.fromarray(face)
                            required_size=(224, 224)
                            subject_face = subject_face.resize(required_size)
                            sample = asarray(subject_face, 'float32')
                            sample = preprocess_input(sample, version=2)
                            subject_embeddings = get_embeddings_live(subject_face)
                            score = cosine(ID_embedding, subject_embeddings)
                            thresh = 0.5
                            if score <= thresh:
                                print('>face is a Match (%.3f <= %.3f)' % (score, thresh))
                                r = tk.Label(text="STATUS: FACE MATCHED", background="white", fg="black", font=("", 15))
                                r.place(x=1000,y=400)
                                flag=True
                            else:
                                print('>face is NOT a Match (%.3f > %.3f)' % (score, thresh))
                except ValueError:
                    pass
                
                cv2.imshow('Video', frame)
                temp_time = time.time()
                print("TIME : ", temp_time-start_time)
                if (cv2.waitKey(1) & 0xFF == ord('q')) or flag==True or (temp_time-start_time)>10:
                    break
            video_capture.release()
            if flag==False:
                r = tk.Label(text='STATUS: FACE NOT MATCHED....', background="white", fg="red", font=("", 15))
                r.place(x=1000,y=400)
            cv2.destroyAllWindows()

        def main():
            def extract_face(filename, required_size=(224, 224)):
                # load image from file
                pixels = pyplot.imread(filename)
                # create the detector, using default weights
                detector = MTCNN()
                # detect faces in the image
                results = detector.detect_faces(pixels)
                # extract the bounding box from the first face
                x1, y1, width, height = results[0]['box']
                x2, y2 = x1 + width, y1 + height
                print("FACE DETECTED.....")
                face = pixels[y1:y2, x1:x2]
                image = Image.fromarray(face)
                image = image.resize(required_size)
                face_array = asarray(image)
                return face_array
        
            # extract faces and calculate face embeddings for a list of photo files
            def get_embeddings(filenames):
                count=0
                faces = [extract_face(f) for f in filenames]
                for f in filenames:
                    args = get_args()
                    depth = args.depth
                    width = args.width
                    face = FaceCV(depth=depth, width=width)
                    age, gender = face.detect_face_image(f)
                    result_str = "AGE : " +  str(age) + " GENDER : " + gender
                    r = tk.Label(text=result_str, background="white", fg="black", font=("", 15))
                    if count==0:
                        r.place(x=500,y=65)
                    else:
                        r.place(x=500, y=400)
                    count=+1

                samples = asarray(faces, 'float32')
                samples = preprocess_input(samples, version=2)
                model = VGGFace(model='resnet50', include_top=False, input_shape=(224, 224, 3), pooling='avg')
                yhat = model.predict(samples)
                return yhat
            
            def is_match(known_embedding, candidate_embedding, thresh=0.5):
                score = cosine(known_embedding, candidate_embedding)
                if score <= thresh:
                    print('>face is a Match (%.3f <= %.3f)' % (score, thresh))
                    r = tk.Label(text="Status: Face Matched", background="white", fg="Brown", font=("", 15))
                    r.place(x=1000,y=400)

                    button = tk.Button(text="Exit", command=exit,height=2,width=10,background="#3b1d7d", fg="black", font=("", 15),activebackground="red")
                    button.place(x=1000,y=600)
                else:
                    print('>face is NOT a Match (%.3f > %.3f)' % (score, thresh))
                    r = tk.Label(text='STATUS: FACE NOT MATCHED....', background="white", fg="black", font=("", 15))
                    r.place(x=1000,y=400)
                    button = tk.Button(text="Exit", command=exit,height=2,width=10,background="#3b1d7d", fg="black", font=("", 15))
                    button.place(x=1000,y=600)
                                
            global fileName1,fileName2      
            filenames = [fileName1,fileName2]
            embeddings = get_embeddings(filenames)
            is_match(embeddings[0], embeddings[1])

        buttonA = tk.Button(text="ANALYSE", command = main,height=1,width=10,fg="black",bg="#3b1d7d",font=("times",15,"bold"))
        buttonA.place(x=1000,y=200)

        buttono = tk.Button(text="OLD PHOTO", command = openphoto,height=1,width=10,fg="black",bg="#3b1d7d",font=("times",15,"bold"))
        buttono.place(x=100,y=200)

        buttonr = tk.Button(text="RECENT PHOTO", command = openphoto2,height=1,width=15,fg="black",bg="#3b1d7d",font=("times",15,"bold"))
        buttonr.place(x=100,y=500)

        buttonr = tk.Button(text="WEB CAMERA", command = open_camera, height=1,width=15,fg="black",bg="#3b1d7d",font=("times",15,"bold"))
        buttonr.place(x=100,y=350)

        window.mainloop()
        self.window.mainloop()
    
    def update(self):
        ret, frame = self.cap.read()
        if ret:
            self.photo = ImageTk.PhotoImage(image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)))
            self.canvas.create_image(0, 0, image = self.photo, anchor = tk.NW) 
        self.window.after(15, self.update)

App(tk.Tk(), "Tkinter Video Looping Background", "video.mp4")