ONNX
Yuantao Feng commited on
Commit
f40140c
·
1 Parent(s): bf10ae7

Update to OpenCV APIs (YuNet -> FaceDetectorYN, SFace -> FaceRecognizerSF) (#6)

Browse files
Files changed (2) hide show
  1. demo.py +4 -16
  2. sface.py +40 -136
demo.py CHANGED
@@ -35,14 +35,13 @@ args = parser.parse_args()
35
 
36
  if __name__ == '__main__':
37
  # Instantiate SFace for face recognition
38
- recognizer = SFace(modelPath=args.model)
39
  # Instantiate YuNet for face detection
40
  detector = YuNet(modelPath='../face_detection_yunet/face_detection_yunet.onnx',
41
  inputSize=[320, 320],
42
  confThreshold=0.9,
43
  nmsThreshold=0.3,
44
- topK=5000,
45
- keepTopK=750)
46
 
47
  img1 = cv.imread(args.input1)
48
  img2 = cv.imread(args.input2)
@@ -56,16 +55,5 @@ if __name__ == '__main__':
56
  assert face2.shape[0] > 0, 'Cannot find a face in {}'.format(args.input2)
57
 
58
  # Match
59
- distance = recognizer.match(img1, face1[0][:-1], img2, face2[0][:-1], args.dis_type)
60
- print(distance)
61
- if args.dis_type == 0:
62
- dis_type = 'Cosine'
63
- threshold = 0.363
64
- result = 'same identity' if distance >= threshold else 'different identity'
65
- elif args.dis_type == 1:
66
- dis_type = 'Norm-L2'
67
- threshold = 1.128
68
- result = 'same identity' if distance <= threshold else 'different identity'
69
- else:
70
- raise NotImplementedError()
71
- print('Using {} distance, threshold {}: {}.'.format(dis_type, threshold, result))
 
35
 
36
  if __name__ == '__main__':
37
  # Instantiate SFace for face recognition
38
+ recognizer = SFace(modelPath=args.model, disType=args.dis_type)
39
  # Instantiate YuNet for face detection
40
  detector = YuNet(modelPath='../face_detection_yunet/face_detection_yunet.onnx',
41
  inputSize=[320, 320],
42
  confThreshold=0.9,
43
  nmsThreshold=0.3,
44
+ topK=5000)
 
45
 
46
  img1 = cv.imread(args.input1)
47
  img2 = cv.imread(args.input2)
 
55
  assert face2.shape[0] > 0, 'Cannot find a face in {}'.format(args.input2)
56
 
57
  # Match
58
+ result = recognizer.match(img1, face1[0][:-1], img2, face2[0][:-1])
59
+ print('Result: {}.'.format('same identity' if result else 'different identities'))
 
 
 
 
 
 
 
 
 
 
 
sface.py CHANGED
@@ -10,156 +10,60 @@ import cv2 as cv
10
  from _testcapi import FLT_MIN
11
 
12
  class SFace:
13
- def __init__(self, modelPath):
14
- self._model = cv.dnn.readNet(modelPath)
15
- self._input_size = [112, 112]
16
- self._dst = np.array([
17
- [38.2946, 51.6963],
18
- [73.5318, 51.5014],
19
- [56.0252, 71.7366],
20
- [41.5493, 92.3655],
21
- [70.7299, 92.2041]
22
- ], dtype=np.float32)
23
- self._dst_mean = np.array([56.0262, 71.9008], dtype=np.float32)
 
 
 
 
24
 
25
  @property
26
  def name(self):
27
  return self.__class__.__name__
28
 
29
- def setBackend(self, backend_id):
30
- self._model.setPreferableBackend(backend_id)
31
-
32
- def setTarget(self, target_id):
33
- self._model.setPreferableTarget(target_id)
 
 
 
 
 
 
 
 
 
 
34
 
35
  def _preprocess(self, image, bbox):
36
- aligned_image = self._alignCrop(image, bbox)
37
- return cv.dnn.blobFromImage(aligned_image)
38
 
39
  def infer(self, image, bbox):
40
  # Preprocess
41
  inputBlob = self._preprocess(image, bbox)
42
 
43
  # Forward
44
- self._model.setInput(inputBlob)
45
- outputBlob = self._model.forward()
46
-
47
- # Postprocess
48
- results = self._postprocess(outputBlob)
49
-
50
- return results
51
 
52
- def _postprocess(self, outputBlob):
53
- return outputBlob / cv.norm(outputBlob)
54
-
55
- def match(self, image1, face1, image2, face2, dis_type=0):
56
  feature1 = self.infer(image1, face1)
57
  feature2 = self.infer(image2, face2)
58
 
59
- if dis_type == 0: # COSINE
60
- return np.sum(feature1 * feature2)
61
- elif dis_type == 1: # NORM_L2
62
- return cv.norm(feature1, feature2)
63
- else:
64
- raise NotImplementedError()
65
-
66
- def _alignCrop(self, image, face):
67
- # Retrieve landmarks
68
- if face.shape[-1] == (4 + 5 * 2):
69
- landmarks = face[4:].reshape(5, 2)
70
- else:
71
- raise NotImplementedError()
72
- warp_mat = self._getSimilarityTransformMatrix(landmarks)
73
- aligned_image = cv.warpAffine(image, warp_mat, self._input_size, flags=cv.INTER_LINEAR)
74
- return aligned_image
75
-
76
- def _getSimilarityTransformMatrix(self, src):
77
- # compute the mean of src and dst
78
- src_mean = np.array([np.mean(src[:, 0]), np.mean(src[:, 1])], dtype=np.float32)
79
- dst_mean = np.array([56.0262, 71.9008], dtype=np.float32)
80
- # subtract the means from src and dst
81
- src_demean = src.copy()
82
- src_demean[:, 0] = src_demean[:, 0] - src_mean[0]
83
- src_demean[:, 1] = src_demean[:, 1] - src_mean[1]
84
- dst_demean = self._dst.copy()
85
- dst_demean[:, 0] = dst_demean[:, 0] - dst_mean[0]
86
- dst_demean[:, 1] = dst_demean[:, 1] - dst_mean[1]
87
-
88
- A = np.array([[0., 0.], [0., 0.]], dtype=np.float64)
89
- for i in range(5):
90
- A[0][0] += dst_demean[i][0] * src_demean[i][0]
91
- A[0][1] += dst_demean[i][0] * src_demean[i][1]
92
- A[1][0] += dst_demean[i][1] * src_demean[i][0]
93
- A[1][1] += dst_demean[i][1] * src_demean[i][1]
94
- A = A / 5
95
-
96
- d = np.array([1.0, 1.0], dtype=np.float64)
97
- if A[0][0] * A[1][1] - A[0][1] * A[1][0] < 0:
98
- d[1] = -1
99
-
100
- T = np.array([
101
- [1.0, 0.0, 0.0],
102
- [0.0, 1.0, 0.0],
103
- [0.0, 0.0, 1.0]
104
- ], dtype=np.float64)
105
-
106
- s, u, vt = cv.SVDecomp(A)
107
- smax = s[0][0] if s[0][0] > s[1][0] else s[1][0]
108
- tol = smax * 2 * FLT_MIN
109
- rank = int(0)
110
- if s[0][0] > tol:
111
- rank += 1
112
- if s[1][0] > tol:
113
- rank += 1
114
- det_u = u[0][0] * u[1][1] - u[0][1] * u[1][0]
115
- det_vt = vt[0][0] * vt[1][1] - vt[0][1] * vt[1][0]
116
- if rank == 1:
117
- if det_u * det_vt > 0:
118
- uvt = np.matmul(u, vt)
119
- T[0][0] = uvt[0][0]
120
- T[0][1] = uvt[0][1]
121
- T[1][0] = uvt[1][0]
122
- T[1][1] = uvt[1][1]
123
- else:
124
- temp = d[1]
125
- d[1] = -1
126
- D = np.array([[d[0], 0.0], [0.0, d[1]]], dtype=np.float64)
127
- Dvt = np.matmul(D, vt)
128
- uDvt = np.matmul(u, Dvt)
129
- T[0][0] = uDvt[0][0]
130
- T[0][1] = uDvt[0][1]
131
- T[1][0] = uDvt[1][0]
132
- T[1][1] = uDvt[1][1]
133
- d[1] = temp
134
- else:
135
- D = np.array([[d[0], 0.0], [0.0, d[1]]], dtype=np.float64)
136
- Dvt = np.matmul(D, vt)
137
- uDvt = np.matmul(u, Dvt)
138
- T[0][0] = uDvt[0][0]
139
- T[0][1] = uDvt[0][1]
140
- T[1][0] = uDvt[1][0]
141
- T[1][1] = uDvt[1][1]
142
-
143
- var1 = 0.0
144
- var2 = 0.0
145
- for i in range(5):
146
- var1 += src_demean[i][0] * src_demean[i][0]
147
- var2 += src_demean[i][1] * src_demean[i][1]
148
- var1 /= 5
149
- var2 /= 5
150
-
151
- scale = 1.0 / (var1 + var2) * (s[0][0] * d[0] + s[1][0] * d[1])
152
- TS = [
153
- T[0][0] * src_mean[0] + T[0][1] * src_mean[1],
154
- T[1][0] * src_mean[0] + T[1][1] * src_mean[1]
155
- ]
156
- T[0][2] = dst_mean[0] - scale * TS[0]
157
- T[1][2] = dst_mean[1] - scale * TS[1]
158
- T[0][0] *= scale
159
- T[0][1] *= scale
160
- T[1][0] *= scale
161
- T[1][1] *= scale
162
- return np.array([
163
- [T[0][0], T[0][1], T[0][2]],
164
- [T[1][0], T[1][1], T[1][2]]
165
- ], dtype=np.float64)
 
10
  from _testcapi import FLT_MIN
11
 
12
  class SFace:
13
+ def __init__(self, modelPath, disType=0, backendId=0, targetId=0):
14
+ self._modelPath = modelPath
15
+ self._backendId = backendId
16
+ self._targetId = targetId
17
+ self._model = cv.FaceRecognizerSF.create(
18
+ model=self._modelPath,
19
+ config="",
20
+ backend_id=self._backendId,
21
+ target_id=self._targetId)
22
+
23
+ self._disType = disType # 0: cosine similarity, 1: Norm-L2 distance
24
+ assert self._disType in [0, 1], "0: Cosine similarity, 1: norm-L2 distance, others: invalid"
25
+
26
+ self._threshold_cosine = 0.363
27
+ self._threshold_norml2 = 1.128
28
 
29
  @property
30
  def name(self):
31
  return self.__class__.__name__
32
 
33
+ def setBackend(self, backendId):
34
+ self._backendId = backendId
35
+ self._model = cv.FaceRecognizerSF.create(
36
+ model=self._modelPath,
37
+ config="",
38
+ backend_id=self._backendId,
39
+ target_id=self._targetId)
40
+
41
+ def setTarget(self, targetId):
42
+ self._targetId = targetId
43
+ self._model = cv.FaceRecognizerSF.create(
44
+ model=self._modelPath,
45
+ config="",
46
+ backend_id=self._backendId,
47
+ target_id=self._targetId)
48
 
49
  def _preprocess(self, image, bbox):
50
+ return self._model.alignCrop(image, bbox)
 
51
 
52
  def infer(self, image, bbox):
53
  # Preprocess
54
  inputBlob = self._preprocess(image, bbox)
55
 
56
  # Forward
57
+ features = self._model.feature(inputBlob)
58
+ return features
 
 
 
 
 
59
 
60
+ def match(self, image1, face1, image2, face2):
 
 
 
61
  feature1 = self.infer(image1, face1)
62
  feature2 = self.infer(image2, face2)
63
 
64
+ if self._disType == 0: # COSINE
65
+ cosine_score = self._model.match(feature1, feature2, self._disType)
66
+ return 1 if cosine_score >= self._threshold_cosine else 0
67
+ else: # NORM_L2
68
+ norml2_distance = self._model.match(feature1, feature2, self._disType)
69
+ return 1 if norml2_distance <= self._threshold_norml2 else 0