# Source code for meerqat.image.face_recognition

"""Usage: <dataset> [<config> --disable_caching]

--disable_caching                       Disables Dataset caching (useless when using save_to_disk), see datasets.set_caching_enabled()
"""

from docopt import docopt
import json
from pathlib import Path
import warnings

import numpy as np

import torch
# arcface_torch is imported defensively: a missing install only triggers a
# warning here, so the module can still be imported. `get_model` is then
# undefined and calling `from_pretrained` will fail with a NameError.
try:
    from arcface_torch.backbones import get_model
except ImportError as e:
    warnings.warn(f"Got the following ImportError: {e}.\n Please install arcface_torch as instructed in README.")
from datasets import load_from_disk, set_caching_enabled

from torchvision.transforms import Compose, ToTensor, Normalize
import cv2
from skimage import transform
from PIL import Image

from import DATA_ROOT_PATH, load_image
from ..models.utils import device

    "r50": ARCFACE_PATH/"ms1mv3_arcface_r50_fp16"/"backbone.pth"
# Target (x, y) positions of the face landmarks after alignment: one row per
# landmark, five rows in total. Passed as `src` to `similarity_transform`.
# Taken from an external reference (the link is missing from this copy).
SRC = np.array(
    [
        [30.2946, 51.6963],
        [65.5318, 51.5014],
        [48.0252, 71.7366],
        [33.5493, 92.3655],
        [62.7299, 92.2041],
    ],
    dtype=np.float32,
)
# Shift every x coordinate by 8 pixels.
# NOTE(review): presumably re-centres a template defined for a narrower crop
# onto the square crop used here -- confirm against the upstream reference.
SRC[:, 0] += 8.0

def similarity_transform(image, landmarks, src, tform, image_size=112):
    """Warp ``image`` so that ``landmarks`` are mapped onto ``src``.

    Adapted from an external implementation (the link is missing from this
    copy).

    Parameters
    ----------
    image :
        Image to align; it is converted with ``np.array(image, dtype=np.uint8)``.
    landmarks :
        Points detected in ``image``, used as the source of the estimation.
    src :
        Points the landmarks should be mapped onto.
    tform :
        Transform object exposing ``estimate(landmarks, src)`` and ``params``.
        It is re-estimated in place on every call.
    image_size : int, optional
        Side length of the square output, in pixels.

    Returns
    -------
    PIL.Image.Image
        The warped image, of size ``image_size`` x ``image_size``.
    """
    # FIXME is there a way to do this without going from Image to ndarray to Image?
    tform.estimate(landmarks, src)
    # Only the top two rows of the estimated matrix are handed to cv2.warpAffine.
    affine_matrix = tform.params[0:2, :]
    pixels = np.array(image, dtype=np.uint8)
    output_size = (image_size, image_size)
    aligned = cv2.warpAffine(pixels, affine_matrix, output_size, borderValue=0.0)
    return Image.fromarray(aligned)
def from_pretrained(model_name='r50', fp16=True, train=False):
    """Build a face-embedding backbone and load its pretrained weights.

    Parameters
    ----------
    model_name : str, optional
        Key into ``PRETRAINED_MODELS``; also passed to ``get_model``.
    fp16 : bool, optional
        Forwarded to ``get_model``.
    train : bool, optional
        Passed to ``model.train``; the default ``False`` puts the model in
        evaluation mode.

    Returns
    -------
    The loaded model, moved to ``device``.

    Raises
    ------
    KeyError
        If ``model_name`` has no entry in ``PRETRAINED_MODELS``.
    """
    model = get_model(model_name, fp16=fp16)
    weight_path = PRETRAINED_MODELS[model_name]
    state_dict = torch.load(weight_path, map_location=device)
    model.load_state_dict(state_dict)
    model.train(train)
    # The model must actually be returned (a bare `return` hands None to the
    # caller) and must live on the same device as the inputs, which
    # compute_face_embedding moves to `device` before the forward pass.
    return model.to(device=device)
def get_pil_preprocessor():
    """Return the preprocessing pipeline applied to each face image.

    Meant for PIL images of shape (H x W x C) in 'RGB' mode. The pipeline
    chains ``ToTensor()`` with a per-channel ``Normalize`` using a mean of
    0.5 and a standard deviation of 0.5 on all three channels.
    """
    channel_mean = (0.5, 0.5, 0.5)
    channel_std = (0.5, 0.5, 0.5)
    steps = [
        ToTensor(),
        Normalize(channel_mean, channel_std),
    ]
    return Compose(steps)
def compute_face_embedding(batch, model, preprocessor, tform, max_n_faces=1, image_key='image'):
    """Compute face embeddings for a batch and store them under 'face_embedding'.

    Parameters
    ----------
    batch : dict
        Must hold ``batch[image_key]`` and ``batch['face_landmarks']``, two
        sequences of the same length. A landmarks entry of ``None`` marks an
        image without any detected face.
    model : callable
        Called once on the concatenated, preprocessed faces.
    preprocessor : callable
        Applied to each aligned face; its result must support ``unsqueeze(0)``.
    tform :
        Transform object forwarded to ``similarity_transform``.
    max_n_faces : int, optional
        Only the first ``max_n_faces`` landmark sets of each image are used.
    image_key : str, optional
        Key of ``batch`` holding the images (anything ``load_image`` accepts).

    Returns
    -------
    dict
        The same ``batch`` object, with ``batch['face_embedding']`` set to a
        list holding, per image, either ``None`` or the slice of the model
        output covering that image's faces.
    """
    # 1. filter out images without any detected faces
    output = []
    not_None_values, not_None_values_indices = [], []
    for i, (image, landmarks) in enumerate(zip(batch[image_key], batch['face_landmarks'])):
        # placeholder, overwritten in step 3 for images that have faces
        output.append(None)
        if landmarks is None:
            continue
        image = load_image(image)
        landmarks = np.array(landmarks[:max_n_faces], dtype=np.float32)
        for landmark in landmarks:
            face = similarity_transform(image, landmark, SRC, tform)
            # add a leading dimension so the faces can be concatenated below
            not_None_values.append(preprocessor(face).unsqueeze(0))
        # remember how many faces belong to image i, to split the output later
        not_None_values_indices.append((i, landmarks.shape[0]))

    # None of the images had a face detected: nothing to feed to the model
    if not not_None_values:
        batch['face_embedding'] = output
        return batch

    # 2. compute face embedding for all faces in a single forward pass
    not_None_values = torch.cat(not_None_values, dim=0).to(device=device)
    not_None_output = model(not_None_values)

    # 3. return the results in a list of list with proper indices
    j = 0
    for i, n_faces in not_None_values_indices:
        output[i] = not_None_output[j: j + n_faces]
        j += n_faces

    batch['face_embedding'] = output
    return batch
def dataset_compute_face_embedding(dataset_path, map_kwargs=None, pretrained_kwargs=None, fn_kwargs=None):
    """Add face embeddings to a dataset stored on disk and save it back.

    Parameters
    ----------
    dataset_path :
        Path given to ``load_from_disk``; the result is saved to the same path.
    map_kwargs : dict, optional
        Extra keyword arguments forwarded to ``dataset.map``.
    pretrained_kwargs : dict, optional
        Keyword arguments forwarded to ``from_pretrained``.
    fn_kwargs : dict, optional
        Extra keyword arguments for ``compute_face_embedding``. The keys
        ``model``, ``preprocessor`` and ``tform`` are always overridden.
    """
    # None replaces the former `{}` defaults: a default dict is shared across
    # calls, and the old fn_kwargs.update() wrote the model into it.
    map_kwargs = {} if map_kwargs is None else map_kwargs
    pretrained_kwargs = {} if pretrained_kwargs is None else pretrained_kwargs

    dataset = load_from_disk(dataset_path)
    model = from_pretrained(**pretrained_kwargs)
    preprocessor = get_pil_preprocessor()
    tform = transform.SimilarityTransform()

    # Build a new dict so the caller's fn_kwargs is left untouched.
    fn_kwargs = dict(fn_kwargs or {}, model=model, preprocessor=preprocessor, tform=tform)
    dataset = dataset.map(compute_face_embedding, batched=True, fn_kwargs=fn_kwargs, **map_kwargs)
    dataset.save_to_disk(dataset_path)
if __name__ == '__main__':
    # Command-line entry point: the usage string is the module docstring.
    args = docopt(__doc__)
    set_caching_enabled(not args['--disable_caching'])

    # The JSON config is optional; without it the defaults of
    # dataset_compute_face_embedding apply.
    config = {}
    config_path = args['<config>']
    if config_path is not None:
        with open(config_path, 'rt') as config_file:
            config = json.load(config_file)

    dataset_compute_face_embedding(args['<dataset>'], **config)