#!/usr/bin/env python2
# openface/demos/compare.py
#
# Example to compare the faces in two images.
# Brandon Amos
# 2015/09/29
#
# Copyright 2015 Carnegie Mellon University
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# `time` is imported and the clock is started before anything else so that
# the verbose report after argument parsing also covers the time spent
# importing the remaining libraries.
import time
start = time.time()

import argparse
import itertools
import os
import sys

import cv2
import numpy as np

import openface
import openface.helper
from openface.data import iterImgs
from openface.alignment import NaiveDlib  # Depends on dlib.

# Print numpy arrays with two digits after the decimal point.
np.set_printoptions(precision=2)

# Directory containing this script; the model directories are located
# relative to it.
fileDir = os.path.dirname(os.path.realpath(__file__))
# Model files live in a `models` directory that is a sibling of this
# script's directory, with one sub-directory per library.
modelDir = os.path.join(fileDir, os.pardir, 'models')
dlibModelDir = os.path.join(modelDir, 'dlib')
openfaceModelDir = os.path.join(modelDir, 'openface')
# Command-line interface: one or more image paths, plus optional overrides
# for the model files, the aligned-face size, CUDA use and verbosity.
parser = argparse.ArgumentParser(
    description="Compare the faces in the given images pairwise.")
parser.add_argument('imgs', type=str, nargs='+', help="Input images.")
parser.add_argument('--dlibFacePredictor', type=str,
                    help="Path to dlib's face predictor.",
                    default=os.path.join(
                        dlibModelDir,
                        "shape_predictor_68_face_landmarks.dat"))
parser.add_argument('--networkModel', type=str,
                    help="Path to Torch network model.",
                    default=os.path.join(openfaceModelDir, 'nn4.v1.t7'))
parser.add_argument('--imgDim', type=int,
                    help="Default image dimension.", default=96)
# Both flags previously had no help text, so `--help` listed them without
# any explanation.
parser.add_argument('--cuda', action='store_true',
                    help="Enable CUDA for the network model.")
parser.add_argument('--verbose', action='store_true',
                    help="Print timing information and the computed "
                         "representations.")

args = parser.parse_args()
if args.verbose:
    # `start` was set at the very top of the script, before the imports.
    print("Argument parsing and loading libraries took {} seconds.".format(
        time.time() - start))
# Build the dlib-based face aligner and the OpenFace network wrapper once,
# up front; getRep() uses both module-level objects for every image.
start = time.time()
align = NaiveDlib(args.dlibFacePredictor)
net = openface.TorchWrap(
    args.networkModel,
    imgDim=args.imgDim,
    cuda=args.cuda)
if args.verbose:
    print("Loading the dlib and OpenFace models took {} seconds."
          .format(time.time() - start))
def getRep(imgPath):
    """Return the network representation of the largest face in an image.

    The image at `imgPath` is read with OpenCV and converted from BGR to
    RGB. The module-level `align` object then supplies the largest face
    bounding box and the aligned face (sized by `args.imgDim`), which is
    passed to `net.forwardImage`. With `args.verbose` set, progress,
    per-stage timings and the resulting representation are printed.

    Returns:
        The value produced by `net.forwardImage` for the aligned face.

    Raises:
        Exception: if the image cannot be loaded, no face bounding box is
            returned, or alignment returns None.
    """
    verbose = args.verbose

    def report(template, since):
        # Print one timing line; the elapsed time is measured at call time.
        if verbose:
            print(template.format(time.time() - since))

    if verbose:
        print("Processing {}.".format(imgPath))

    # cv2.imread signals failure by returning None rather than raising.
    bgr = cv2.imread(imgPath)
    if bgr is None:
        raise Exception("Unable to load image: {}".format(imgPath))
    rgb = cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)
    if verbose:
        print(" + Original size: {}".format(rgb.shape))

    # Stage 1: locate the largest face.
    tic = time.time()
    faceBox = align.getLargestFaceBoundingBox(rgb)
    if faceBox is None:
        raise Exception("Unable to find a face: {}".format(imgPath))
    report(" + Face detection took {} seconds.", tic)

    # Stage 2: align the detected face to the network's input size.
    tic = time.time()
    aligned = align.alignImg("affine", args.imgDim, rgb, faceBox)
    if aligned is None:
        raise Exception("Unable to align image: {}".format(imgPath))
    report(" + Face alignment took {} seconds.", tic)

    # Stage 3: run the aligned face through the network.
    tic = time.time()
    embedding = net.forwardImage(aligned)
    report(" + OpenFace forward pass took {} seconds.", tic)
    if verbose:
        print("Representation:")
        print(embedding)
        print("-----\n")
    return embedding
# Compare every unordered pair of input images.
#
# Each representation is computed lazily on first use and cached by path, so
# an image that appears in several pairs goes through getRep() only once
# instead of once per pair. The order in which images are first processed is
# the same as without the cache.
_repCache = {}


def _cachedRep(imgPath):
    """Return getRep(imgPath), computing it at most once per distinct path."""
    if imgPath not in _repCache:
        _repCache[imgPath] = getRep(imgPath)
    return _repCache[imgPath]


for (img1, img2) in itertools.combinations(args.imgs, 2):
    # The subtraction creates a new array, so cached values are not mutated.
    d = _cachedRep(img1) - _cachedRep(img2)
    print("Comparing {} with {}.".format(img1, img2))
    print(" + Squared l2 distance between representations: {:0.3f}".format(
        np.dot(d, d)))