-
Notifications
You must be signed in to change notification settings - Fork 0
/
transform.py
416 lines (376 loc) · 15.5 KB
/
transform.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
#!/usr/bin/env python
'''
Create a new dataset by
1. Extracting physical features from images
2. Applying attractiveness algorithms to images
- Rule of thirds
- Rule of fifths
- Golden ratio
3. Aggregate relevant data points from all data sets
'''
from multiprocessing import Pool
from algorithms import *
import pandas as pd
import numpy as np
import argparse
import base64
import model
import dlib
import math
import json
import cv2
import os
# Global var for path to volume within container
PATH_TO_VOLUME = os.path.join(os.getcwd(), 'data')
# makedirs(..., exist_ok=True) replaces the old exists()/mkdir() pair, which
# was race-prone when several processes started at once (TOCTOU).
os.makedirs(PATH_TO_VOLUME, exist_ok=True)
'''
Helper functions
'''
def b64_to_img(uri):
    """Decode a 'data:image/...;base64,...' URI into an OpenCV BGR image."""
    # Everything after the comma is the raw base64 payload
    payload = uri.split(',')[1]
    pixel_bytes = np.frombuffer(base64.b64decode(payload), np.uint8)
    return cv2.imdecode(pixel_bytes, cv2.IMREAD_COLOR)
def euclidean_distance(a, b):
    """Return the Euclidean (straight-line) distance between 2-D points.

    Args:
        a: (x, y) sequence; only the first two components are used.
        b: (x, y) sequence; only the first two components are used.

    Returns:
        float: sqrt((x2 - x1)^2 + (y2 - y1)^2)
    """
    # math.dist runs in C and avoids the hand-rolled square/sqrt arithmetic.
    # Slicing to two components preserves the original behavior for longer
    # tuples (the old code only ever read indices 0 and 1).
    return math.dist((a[0], a[1]), (b[0], b[1]))
def rotate_img(img, angle):
    """Rotate *img* about its center by *angle* degrees and return the result."""
    # shape[1::-1] is (width, height) — the order cv2 expects
    width_height = img.shape[1::-1]
    center = tuple(np.array(width_height) / 2)
    rotation = cv2.getRotationMatrix2D(center, angle, 1.0)
    return cv2.warpAffine(img, rotation, width_height, flags=cv2.INTER_LINEAR)
# Path to the dlib shape predictor model
# (from http://dlib.net/files/shape_predictor_68_face_landmarks.dat.bz2)
_SHAPE_PREDICTOR_PATH = '/usr/bin/shape_predictor_68_face_landmarks.dat'
# Lazily-loaded predictor, cached per process (safe with multiprocessing.Pool,
# since each worker process gets its own copy).
_shape_predictor = None

def detect_landmarks(x, y, w, h, img):
    """Detect the 68 dlib facial landmarks inside the given face rectangle.

    Args:
        x, y: Top-left corner of the detected face rectangle.
        w, h: Width and height of the face rectangle.
        img: Image to run the predictor on.

    Returns:
        np.matrix of shape (68, 2) with the (x, y) pixel coordinates of each
        landmark.
    """
    global _shape_predictor
    # PERF FIX: the original re-read the predictor model from disk on every
    # call; load it once per process and reuse it.
    if _shape_predictor is None:
        _shape_predictor = dlib.shape_predictor(_SHAPE_PREDICTOR_PATH)
    # Convert the cv2 rectangle coordinates to a dlib rectangle
    dlib_rect = dlib.rectangle(x, y, x + w, y + h)
    # Detect landmarks and convert to an np matrix of (x, y) points
    detected_landmarks = _shape_predictor(img, dlib_rect).parts()
    return np.matrix([[p.x, p.y] for p in detected_landmarks])
'''
Rotate a contestant's photo so that their face is straight
Guidance from: https://sefiks.com/2020/02/23/face-alignment-for-face-recognition-in-python-within-opencv/
'''
def get_face_rotation(img):
    """Find the first plausible face in *img* and the angle needed to level its eyes.

    Guidance from:
    https://sefiks.com/2020/02/23/face-alignment-for-face-recognition-in-python-within-opencv/

    Returns:
        (face_index, angle): index of the qualifying face within the Haar
        cascade results and the rotation angle in degrees (negative means
        clockwise), or (None, None) when no face passes the mouth/eye checks.
    """
    # Load pre-trained classifiers
    # NOTE(review): haarcascade_mcs_mouth.xml is not bundled with stock OpenCV
    # wheels — confirm it is present in cv2.data.haarcascades at runtime.
    face_cascade = cv2.CascadeClassifier(f'{cv2.data.haarcascades}haarcascade_frontalface_default.xml')
    mouth_cascade = cv2.CascadeClassifier(f'{cv2.data.haarcascades}haarcascade_mcs_mouth.xml')
    eye_cascade = cv2.CascadeClassifier(f'{cv2.data.haarcascades}haarcascade_eye.xml')
    # Convert to grayscale
    img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
    # Apply a Gaussian blur with a 3 x 3 kernel to help remove high frequency noise
    img_gauss = cv2.GaussianBlur(img_gray,(3,3), 0)
    # Detect contestant's face
    # https://stackoverflow.com/questions/20801015/recommended-values-for-opencv-detectmultiscale-parameters
    faces = face_cascade.detectMultiScale(img_gauss, scaleFactor=1.05, minNeighbors=6, minSize=(20,20), flags=cv2.CASCADE_SCALE_IMAGE)
    face_index = 0
    for face in faces:
        (x, y, w, h) = face
        # Get face image (sub-image restricted to the candidate face)
        face_img = img_gauss[y:y+h, x:x+w]
        # Detect a mouth
        mouth = mouth_cascade.detectMultiScale(face_img, scaleFactor=1.05, minNeighbors=6)
        if len(mouth) > 0:
            # Detect eyes JUST for second check that detected face is truly a face
            eyes = eye_cascade.detectMultiScale(face_img, scaleFactor=1.05, minNeighbors=1)
            # Ensure that at least one eye was detected
            if len(eyes) > 0:
                # Detect landmarks -- NOTE: it seems as if all landmarks are truly at point landmark-1
                landmarks = detect_landmarks(x, y, w, h, img)
                # Get the center point of (midpoint between) each eye.
                # NOTE: `y` is reused as a scratch variable from here on,
                # clobbering the face rectangle's y — intentional in the
                # original, so preserved.
                # Get top left and bottom right points of right eye
                # (dlib points 36-41 are the right eye)
                if landmarks[37, 1] > landmarks[38, 1]:
                    y = landmarks[38, 1]
                else:
                    y = landmarks[37, 1]
                right_top_left = (landmarks[36, 0], y)
                if landmarks[41, 1] > landmarks[40, 1]:
                    y = landmarks[41, 1]
                else:
                    y = landmarks[40, 1]
                right_bottom_right = (landmarks[39, 0], y)
                # Get top left and bottom right points of left eye
                # (dlib points 42-47 are the left eye)
                if landmarks[43, 1] > landmarks[44, 1]:
                    y = landmarks[44, 1]
                else:
                    y = landmarks[43, 1]
                left_top_left = (landmarks[42, 0], y)
                if landmarks[47, 1] > landmarks[46, 1]:
                    y = landmarks[47, 1]
                else:
                    y = landmarks[46, 1]
                left_bottom_right = (landmarks[45, 0], y)
                # Get the center points of each eye (midpoint formula)
                right_x = (right_top_left[0] + right_bottom_right[0])//2
                right_y = (right_top_left[1] + right_bottom_right[1])//2
                right_center = (right_x, right_y)
                left_x = (left_top_left[0] + left_bottom_right[0])//2
                left_y = (left_top_left[1] + left_bottom_right[1])//2
                left_center = (left_x, left_y)
                # Evaluate the location of the horizontal point and direction of rotation (clockwise or counterclockwise)
                if left_y < right_y:
                    horiz_point = (right_x, left_y)
                    direction = -1 # clockwise
                else:
                    horiz_point = (left_x, right_y)
                    direction = 1 # counterclockwise
                # Evaluate the edge lengths of the triangle made up of the line between the center of the eyes,
                # a perfectly horizontal line, and a perfectly vertical line (with euclidean distance)
                a = euclidean_distance(left_center, horiz_point)
                b = euclidean_distance(right_center, left_center)
                c = euclidean_distance(right_center, horiz_point)
                # Find the possible angle of rotation with arc cosine (law of cosines)
                if b > 0 and c > 0: # Ensure no division by 0
                    arc_cos = (b*b + c*c - a*a)/(2*b*c)
                else:
                    arc_cos = 0
                angle = np.arccos(arc_cos)
                # Convert angle from radians to degrees
                angle = (angle * 180) / math.pi
                # If rotating clockwise, evaluate angle by negative evaluation of 90-angle
                # (sum of all angles of a triangle = 180; we've already created a right 90
                # degree angle between the horizontal/vertical lines and the eye-center line)
                if direction == -1:
                    angle = 0-(90 - angle)
                # Return the angle to rotate for the first qualifying face
                return face_index, angle
        # Only reached when this candidate lacked a mouth or eyes
        face_index += 1
    # No candidate face passed both sanity checks
    return None, None
'''
Crop a contestant's photo to just their face
'''
def process_face(id, name, b64photo):
    """Straighten, crop, and resize a contestant's photo down to just their face.

    Args:
        id: Contestant identifier (stringified into the record).
        name: Contestant display name (copied into the record).
        b64photo: 'data:image/...;base64,...' encoded source photo.

    Returns:
        (id, record): record is the modeled data-set-5 row, or {} when no
        usable face image could be produced.
    """
    # Initialize data model handler object
    bachmodel = model.bachmodel(PATH_TO_VOLUME)
    # Load pre-trained classifier
    face_cascade = cv2.CascadeClassifier(f'{cv2.data.haarcascades}haarcascade_frontalface_default.xml')
    # Extract image extension (e.g. '.jpeg') from the data-URI mime type
    ext = f'''.{b64photo.split(';base64')[0].split('/')[-1]}'''
    # Convert base64 encoded photo to a cv2 image
    img = b64_to_img(b64photo)
    # Find detected face index and rotation angle for image
    face_index, rotation_angle = get_face_rotation(img)
    # BUG FIX: get_face_rotation returns (None, None) when no face qualifies;
    # passing None into cv2.getRotationMatrix2D raised. Fall back to the
    # unrotated image instead.
    if rotation_angle is None:
        img_straight = img
    else:
        img_straight = rotate_img(img, rotation_angle)
    # Many thanks to https://github.com/rajendra7406-zz/FaceShape -->
    # Make a copy of the original (straightened) image
    img_original = img_straight.copy()
    # Convert to grayscale
    img_gray = cv2.cvtColor(img_straight, cv2.COLOR_BGR2GRAY)
    # Apply a Gaussian blur with a 3 x 3 kernel to help remove high frequency noise
    img_gauss = cv2.GaussianBlur(img_gray, (3, 3), 0)
    # Detect contestant's face
    # https://stackoverflow.com/questions/20801015/recommended-values-for-opencv-detectmultiscale-parameters
    faces = face_cascade.detectMultiScale(img_gauss, scaleFactor=1.05, minNeighbors=6, minSize=(20, 20), flags=cv2.CASCADE_SCALE_IMAGE)
    record = {}
    if len(faces) > 0:
        # BUG FIX: the original's `not face_index` also triggered on the valid
        # index 0; test explicitly for None / out-of-range instead.
        if face_index is None or len(faces) <= face_index:
            face_index = 0
        # Use face at face_index (from rotation angle evaluation)
        (x, y, w, h) = faces[face_index]
        # Detect landmarks
        landmarks = detect_landmarks(x, y, w, h, img_straight)
        # Reference points: cheeks (1/15), jaw (3/13), chin (8), forehead top
        cheek_left = (landmarks[1, 0], landmarks[1, 1])
        cheek_right = (landmarks[15, 0], landmarks[15, 1])
        jaw_left = (landmarks[3, 0], landmarks[3, 1])
        jaw_right = (landmarks[13, 0], landmarks[13, 1])
        face_bottom = (landmarks[8, 0], landmarks[8, 1])
        face_top = (landmarks[8, 0], y)
        # Bounding box: take the widest of cheek/jaw on each side
        if cheek_left[0] < jaw_left[0]:
            top_left = (cheek_left[0], face_top[1])
        else:
            top_left = (jaw_left[0], face_top[1])
        # BUG FIX: the original compared cheek_right[0] with itself (always
        # False), so the right edge always came from the jaw point; compare
        # against jaw_right as intended.
        if cheek_right[0] > jaw_right[0]:
            bottom_right = (cheek_right[0], face_bottom[1])
        else:
            bottom_right = (jaw_right[0], face_bottom[1])
        # Crop photo to just contestant's face
        img_cropped = img_original[top_left[1]:bottom_right[1], top_left[0]:bottom_right[0]]
        # Resize image to height == 150 (for standardization), preserving aspect ratio
        resize_height = 150
        h, w, c = img_cropped.shape
        ratio = resize_height / h
        dimensions = (int(w * ratio), resize_height)
        try:
            img_resized = cv2.resize(img_cropped, dimensions, interpolation=cv2.INTER_AREA)
        except Exception as e:
            print(f' 💔 {e}')
            img_resized = np.array([])
        if img_resized.size > 0:
            # Encode resized, cropped image as base64 string
            b64face = f'''data:image/jpeg;base64,{base64.b64encode(cv2.imencode(ext, img_resized)[1]).decode()}'''
            # Lastly, detect new landmarks on the cropped image
            h, w, c = img_resized.shape
            landmarks = detect_landmarks(0, 0, w, h, img_resized).tolist()
            # Model the data
            record = {
                'id': str(id),
                'name': name,
                'dlib_landmarks': landmarks,
                'face_photo': b64face,
                'face_height': h,
                'face_width': w
            }
    if len(record) > 0:
        # Model the record
        record = bachmodel.model_one(5, record)
    # Return the record (empty dict signals failure to the caller)
    return id, record
def eval_rule_of_thirds(id, name, face, dlib_landmarks):
    """Score *face* against the rule of thirds; returns (id, results dict)."""
    face_img = b64_to_img(face)
    points = np.array(dlib_landmarks)
    return id, rule_of_thirds.evaluate(face_img, points)
def eval_rule_of_fifths(id, name, face, dlib_landmarks):
    """Score *face* against the rule of fifths; returns (id, results dict)."""
    face_img = b64_to_img(face)
    points = np.array(dlib_landmarks)
    return id, rule_of_fifths.evaluate(face_img, points)
def eval_golden_ratio(id, name, face, dlib_landmarks):
    """Score *face* against the golden ratio; returns (id, results dict)."""
    face_img = b64_to_img(face)
    points = np.array(dlib_landmarks)
    return id, golden_ratio.evaluate(face_img, points)
def _pretty_name(raw):
    """Convert a 'first_last' CLI argument into a 'First Last' display name."""
    names = raw.lower().split('_')
    return f'{names[0].capitalize()} {names[1].capitalize()}'

def _merge_results(df5, responses):
    """Fold per-contestant algorithm results back into the data set 5 dataframe."""
    for id, rec in responses:
        for key, value in rec.items():
            df5.loc[df5['id'] == id, [key]] = value

def main():
    """Preprocess and/or evaluate data set 5 according to the CLI flags.

    Preprocessing rotates, crops, and landmarks contestant photos (data set 3,
    falling back to Instagram photos from data set 4); evaluation applies the
    requested attractiveness algorithms and saves the results.
    """
    # Retrieve args
    parser = argparse.ArgumentParser(description='Process contestant data')
    parser.add_argument('--preprocess', dest='preprocess', action='store_true', help='preprocess the data (rotate, crop, and identify dlib landmarks) for data set 5')
    parser.add_argument('--evaluate', dest='evaluate', action='store_true', help='evaluate data set 5 with the algorithms')
    parser.add_argument('--algorithm', dest='algorithm', type=str, nargs='+', default=['thirds','fifths','golden'], help='a string algorithm name to perform (thirds, fifths, and/or golden)')
    parser.add_argument('--contestant', dest='contestant', type=str, nargs='+', default=[], help='a string contestant first and last name separated by "_" (i.e. joelle_fletcher)')
    args = parser.parse_args()
    # Initialize multiprocessing pool with 5 worker processes
    pool = Pool(processes=5)
    # Initialize data model handler object
    bachmodel = model.bachmodel(PATH_TO_VOLUME)
    # Initialize dataframe variable
    df5 = None
    # Evaluate flags: neither (or both) flags given means do both stages
    both = args.preprocess == args.evaluate
    preprocess = both or args.preprocess
    evaluate = both or args.evaluate
    # If the user wants to preprocess the data
    if preprocess:
        print('🌹 Preprocessing data for data set 5')
        # BUG FIX: contestants was previously undefined when data set 3 was
        # empty, raising NameError at the starmap call below.
        contestants = []
        # If no contestants are given by the user, process every contestant from data set 3 in the database
        if len(args.contestant) == 0:
            # Read-in ds3 as dataframe
            df3 = bachmodel.retrieve_df(3)
            if not df3.empty:
                # Retrieve list of contestants
                contestants = df3[['id', 'name', 'photo']].values.tolist()
            if len(contestants) == 0:
                print(f' 💔 Unable to compile data set 5. Has data set 3 been collected and stored?')
        else:
            # Read-in ds3 as dataframe
            df3 = bachmodel.retrieve_df(3)
            if not df3.empty:
                for raw in args.contestant:
                    name = _pretty_name(raw)
                    # Get contestant's id, name, and photo
                    match = df3.loc[df3['name'] == name][['id', 'name', 'photo']].values.tolist()
                    if len(match) > 0:
                        contestants += match
        # Multiprocess rotating, cropping, and finding facial landmarks of contestants' faces via their photos
        ds5_resp = pool.starmap_async(process_face, contestants)
        # Separate good and empty response records
        ds5_recs = []
        ds5_null = []
        for resp in ds5_resp.get():
            if len(resp[1]) > 0:
                ds5_recs.append(resp[1])
            else:
                ds5_null.append(resp[0])
        # Attempt to retrieve and preprocess Instagram profile pictures from the
        # contestants whose headshots from the show were not preprocessed successfully
        if len(ds5_null) > 0:
            # Load data set 4
            df4 = bachmodel.retrieve_df(4)
            if not df4.empty:
                contestants = []
                for id in ds5_null:
                    match = df4.loc[df4['id'] == id][['id', 'name', 'prof_photo']].values.tolist()
                    if len(match) > 0:
                        contestants.append(match[0])
                # Multiprocess preprocessing again
                ds5_resp = pool.starmap_async(process_face, contestants)
                ds5_recs += [resp[1] for resp in ds5_resp.get() if len(resp[1]) > 0]
        df5 = pd.DataFrame(ds5_recs)
        # Save data set 5
        bachmodel.save_df(df5, 5)
    # Perform algorithms if specified
    if evaluate:
        # If data set 5 hasn't been read-in to a dataframe, attempt to read data set 5 from pickled file
        if not isinstance(df5, pd.DataFrame):
            df5 = bachmodel.retrieve_df(5)
        if not df5.empty:
            # BUG FIX: the named-contestant branch below previously built a
            # `contestant` list but never populated `contestants`, raising
            # NameError at the first starmap call.
            contestants = []
            # If no contestants are given by the user, evaluate everyone in data set 5
            if len(args.contestant) == 0:
                # Retrieve contestants' ids, name, face, and dlib landmarks
                contestants = df5[['id', 'name', 'face_photo', 'dlib_landmarks']].values.tolist()
                if len(contestants) == 0:
                    print(f' 💔 Unable to evaluate rule of thirds. Has data set 5 been collected, preprocessed, and stored?')
            else:
                for raw in args.contestant:
                    name = _pretty_name(raw)
                    # Get contestant's id, name, face, and dlib landmarks
                    match = df5.loc[df5['name'] == name][['id', 'name', 'face_photo', 'dlib_landmarks']].values.tolist()
                    contestants += match
            # Run each requested algorithm, merging its results into df5 and saving after each
            for flag, func, label in (
                ('thirds', eval_rule_of_thirds, 'Rule of Thirds'),
                ('fifths', eval_rule_of_fifths, 'Rule of Fifths'),
                ('golden', eval_golden_ratio, 'Golden Ratio'),
            ):
                if flag in args.algorithm:
                    print(f'🌹 Evaluating the {label}')
                    # Multiprocess
                    ds5_resp = pool.starmap_async(func, contestants)
                    # Update data set 5 dataframe
                    _merge_results(df5, ds5_resp.get())
                    # Save data set 5
                    bachmodel.save_df(df5, 5)
# Script entry point: run main() only when executed directly, not on import
if __name__ == '__main__':
    main()