Files
insightface/recognition/embedding.py

65 lines
2.1 KiB
Python
Raw Normal View History

2018-07-10 18:04:13 +08:00
import argparse
import cv2
import numpy as np
import sys
import mxnet as mx
import datetime
from skimage import transform as trans
import sklearn
from sklearn import preprocessing
class Embedding:
def __init__(self, prefix, epoch, ctx_id=0):
print('loading',prefix, epoch)
ctx = mx.gpu(ctx_id)
sym, arg_params, aux_params = mx.model.load_checkpoint(prefix, epoch)
all_layers = sym.get_internals()
sym = all_layers['fc1_output']
image_size = (112,112)
self.image_size = image_size
model = mx.mod.Module(symbol=sym, context=ctx, label_names = None)
#model = mx.mod.Module(symbol=sym, context=ctx)
model.bind(for_training=False, data_shapes=[('data', (1, 3, image_size[0], image_size[1]))])
model.set_params(arg_params, aux_params)
self.model = model
src = np.array([
[30.2946, 51.6963],
[65.5318, 51.5014],
[48.0252, 71.7366],
[33.5493, 92.3655],
[62.7299, 92.2041] ], dtype=np.float32 )
if image_size[1]==112:
src[:,0] += 8.0
self.src = src
def get(self, rimg, landmark):
2018-07-10 18:15:10 +08:00
assert landmark.shape[0]==68 or landmark.shape[0]==5
2018-07-10 18:04:13 +08:00
assert landmark.shape[1]==2
2018-07-10 18:15:10 +08:00
if landmark.shape[0]==68:
landmark5 = np.zeros( (5,2), dtype=np.float32 )
landmark5[0] = (landmark[36]+landmark[39])/2
landmark5[1] = (landmark[42]+landmark[45])/2
landmark5[2] = landmark[30]
landmark5[3] = landmark[48]
landmark5[4] = landmark[54]
else:
landmark5 = landmark
2018-07-10 18:04:13 +08:00
tform = trans.SimilarityTransform()
tform.estimate(landmark5, self.src)
M = tform.params[0:2,:]
img = cv2.warpAffine(rimg,M,(self.image_size[1],self.image_size[0]), borderValue = 0.0)
img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
img = np.transpose(img, (2,0,1)) #3*112*112, RGB
input_blob = np.zeros( (1, 3, self.image_size[1], self.image_size[0]),dtype=np.uint8 )
input_blob[0] = img
data = mx.nd.array(input_blob)
db = mx.io.DataBatch(data=(data,))
self.model.forward(db, is_train=False)
embedding = self.model.get_outputs()[0].asnumpy()
embedding = sklearn.preprocessing.normalize(embedding).flatten()
return embedding