from __future__ import print_function
import os
import torch
from torch.utils.model_zoo import load_url
from enum import Enum
from skimage import io
from skimage import color
import numpy as np
import cv2
try:
import urllib.request as request_file
except BaseException:
import urllib as request_file
from .models import FAN, ResNetDepth
from .utils import *
class LandmarksType(Enum):
"""Enum class defining the type of landmarks to detect.
    ``_2D`` - the detected points ``(x,y)`` lie in a 2D space and follow the visible contour of the face
    ``_2halfD`` - these points represent the 2D projection of the 3D points into the image plane
    ``_3D`` - the points ``(x,y,z)`` are detected in a 3D space
"""
_2D = 1
_2halfD = 2
_3D = 3
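# For example, FaceAlignment(LandmarksType._2D) below predicts 68 (x, y)
# points per face, while LandmarksType._3D adds a depth value to each point.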
class NetworkSize(Enum):
# TINY = 1
# SMALL = 2
# MEDIUM = 3
LARGE = 4
def __new__(cls, value):
member = object.__new__(cls)
member._value_ = value
return member
def __int__(self):
return self.value
models_urls = {
'2DFAN-4': 'https://www.adrianbulat.com/downloads/python-fan/2DFAN4-11f355bf06.pth.tar',
'3DFAN-4': 'https://www.adrianbulat.com/downloads/python-fan/3DFAN4-7835d9f11d.pth.tar',
'depth': 'https://www.adrianbulat.com/downloads/python-fan/depth-2a464da4ea.pth.tar',
}
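# Pretrained weight files. ``load_url`` below downloads each file once and
# caches it locally, so later runs reuse the cached copy.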
class FaceAlignment:
def __init__(self, landmarks_type, network_size=NetworkSize.LARGE,
device='cuda', flip_input=False, face_detector='sfd', verbose=False):
self.device = device
self.flip_input = flip_input
self.landmarks_type = landmarks_type
self.verbose = verbose
network_size = int(network_size)
if 'cuda' in device:
torch.backends.cudnn.benchmark = True
# Get the face detector
face_detector_module = __import__('face_alignment.detection.' + face_detector,
globals(), locals(), [face_detector], 0)
self.face_detector = face_detector_module.FaceDetector(device=device, verbose=verbose)
        # Initialise the face alignment network
self.face_alignment_net = FAN(network_size)
if landmarks_type == LandmarksType._2D:
network_name = '2DFAN-' + str(network_size)
else:
network_name = '3DFAN-' + str(network_size)
fan_weights = load_url(models_urls[network_name], map_location=lambda storage, loc: storage)
self.face_alignment_net.load_state_dict(fan_weights)
self.face_alignment_net.to(device)
self.face_alignment_net.eval()
        # Initialise the depth prediction network
if landmarks_type == LandmarksType._3D:
self.depth_prediciton_net = ResNetDepth()
depth_weights = load_url(models_urls['depth'], map_location=lambda storage, loc: storage)
depth_dict = {
k.replace('module.', ''): v for k,
v in depth_weights['state_dict'].items()}
self.depth_prediciton_net.load_state_dict(depth_dict)
self.depth_prediciton_net.to(device)
self.depth_prediciton_net.eval()
def get_landmarks(self, image_or_path, detected_faces=None):
"""Deprecated, please use get_landmarks_from_image
Arguments:
image_or_path {string or numpy.array or torch.tensor} -- The input image or path to it.
Keyword Arguments:
detected_faces {list of numpy.array} -- list of bounding boxes, one for each face found
in the image (default: {None})
"""
return self.get_landmarks_from_image(image_or_path, detected_faces)
def get_landmarks_from_image(self, image_or_path, detected_faces=None):
"""Predict the landmarks for each face present in the image.
This function predicts a set of 68 2D or 3D images, one for each image present.
If detect_faces is None the method will also run a face detector.
Arguments:
image_or_path {string or numpy.array or torch.tensor} -- The input image or path to it.
Keyword Arguments:
detected_faces {list of numpy.array} -- list of bounding boxes, one for each face found
in the image (default: {None})
"""
if isinstance(image_or_path, str):
try:
image = io.imread(image_or_path)
except IOError:
print("error opening file :: ", image_or_path)
return None
else:
image = image_or_path
        if image.ndim == 2:
            # Grayscale input: replicate the channel to get an RGB image.
            image = color.gray2rgb(image)
        elif image.ndim == 3 and image.shape[-1] == 4:
            # RGBA input: drop the alpha channel.
            image = image[..., :3]
        if detected_faces is None:
            # The detector expects BGR input, so reverse the channel order.
            detected_faces = self.face_detector.detect_from_image(image[..., ::-1].copy())
if len(detected_faces) == 0:
print("Warning: No faces were detected.")
return None
        # Inference only: disable gradient tracking for the prediction loop.
        torch.set_grad_enabled(False)
landmarks = []
        for d in detected_faces:
            # Centre of the bounding box, shifted upwards by 12% of the box
            # height to better centre on the face.
            center = torch.FloatTensor(
                [d[2] - (d[2] - d[0]) / 2.0, d[3] - (d[3] - d[1]) / 2.0])
            center[1] = center[1] - (d[3] - d[1]) * 0.12
            scale = (d[2] - d[0] + d[3] - d[1]) / self.face_detector.reference_scale
            # Crop the face region and convert it to a normalised CHW tensor.
            inp = crop(image, center, scale)
            inp = torch.from_numpy(inp.transpose((2, 0, 1))).float()
            inp = inp.to(self.device)
            inp.div_(255.0).unsqueeze_(0)
            out = self.face_alignment_net(inp)[-1].detach()
            if self.flip_input:
                # Add the prediction for the horizontally flipped input
                # (test-time augmentation) for a small accuracy gain.
                out += flip(self.face_alignment_net(flip(inp))[-1].detach(), is_label=True)
            out = out.cpu()
            # Decode heatmaps into coordinates; multiply by 4 to map from the
            # 64x64 heatmaps back to the 256x256 crop.
            pts, pts_img = get_preds_fromhm(out, center, scale)
            pts, pts_img = pts.view(68, 2) * 4, pts_img.view(68, 2)
            if self.landmarks_type == LandmarksType._3D:
                # Render one Gaussian heatmap per predicted 2D landmark and
                # feed it, together with the image crop, to the depth network.
                heatmaps = np.zeros((68, 256, 256), dtype=np.float32)
                for i in range(68):
                    if pts[i, 0] > 0:
                        heatmaps[i] = draw_gaussian(heatmaps[i], pts[i], 2)
                heatmaps = torch.from_numpy(heatmaps).unsqueeze_(0)
                heatmaps = heatmaps.to(self.device)
                depth_pred = self.depth_prediciton_net(
                    torch.cat((inp, heatmaps), 1)).data.cpu().view(68, 1)
                # Rescale the predicted depth to image coordinates and append
                # it as the third column.
                pts_img = torch.cat(
                    (pts_img, depth_pred * (1.0 / (256.0 / (200.0 * scale)))), 1)
landmarks.append(pts_img.numpy())
return landmarks
def get_landmarks_from_directory(self, path, extensions=['.jpg', '.png'], recursive=True, show_progress_bar=True):
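        """Scan a directory for images, then detect faces and predict landmarks for each image found.

        Arguments:
            path {string} -- path to the directory to scan

        Keyword Arguments:
            extensions {list of string} -- image file extensions to consider (default: {['.jpg', '.png']})
            recursive {boolean} -- also scan subdirectories (default: {True})
            show_progress_bar {boolean} -- show a progress bar during detection (default: {True})
        """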
detected_faces = self.face_detector.detect_from_directory(path, extensions, recursive, show_progress_bar)
predictions = {}
for image_path, bounding_boxes in detected_faces.items():
image = io.imread(image_path)
preds = self.get_landmarks_from_image(image, bounding_boxes)
predictions[image_path] = preds
return predictions
    @staticmethod
    def remove_models():
        # Delete the locally cached model weights.
base_path = os.path.join(appdata_dir('face_alignment'), "data")
for data_model in os.listdir(base_path):
file_path = os.path.join(base_path, data_model)
try:
if os.path.isfile(file_path):
print('Removing ' + data_model + ' ...')
os.unlink(file_path)
except Exception as e:
print(e)
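

# A minimal usage sketch, not part of the library. Because of the relative
# imports above, this module must be run in a package context (for example
# ``python -m face_alignment.<this_module>``); 'example.jpg' is a
# hypothetical placeholder path.
if __name__ == '__main__':
    fa = FaceAlignment(LandmarksType._2D, device='cpu', flip_input=False)
    preds = fa.get_landmarks_from_image('example.jpg')
    if preds is None:
        print('No faces detected.')
    else:
        # One (68, 2) array of (x, y) coordinates per detected face.
        print('Found %d face(s); first point: %s' % (len(preds), preds[0][0]))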