Embedded Engineer AI Challenge Camp: RV1106 Face Recognition + Work Log (7) PC Inference
<p>Continuing from last time: the Y-axis offset problem has been traced to how the input image size is handled.</p><p>The model's input size is 640x640, so the image must be scaled down before it goes into the model, and the inference results must then be scaled back up to the original image size.</p>
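<p>The fix is simply the inverse of the letterbox transform. Below is a minimal sketch of that mapping, assuming a <code>scale</code> factor and <code>offset_x</code>/<code>offset_y</code> padding offsets like those computed by the script further down (the function name <code>map_back</code> is illustrative, not part of the script); dropping the <code>offset_y</code> term is exactly what produces a Y-axis shift:</p>
<pre>
<code>import numpy as np

def map_back(boxes, scale, offset_x, offset_y):
    """Map model-space boxes (x1, y1, x2, y2) back to original-image coordinates."""
    boxes = boxes.astype(np.float32).copy()
    boxes[..., 0::2] = (boxes[..., 0::2] - offset_x) / scale  # x coordinates
    boxes[..., 1::2] = (boxes[..., 1::2] - offset_y) / scale  # y coordinates
    return boxes</code></pre>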
<pre>
<code>#
import os
import sys
import urllib
import urllib.request
import time
import numpy as np
import cv2
import insightface
from insightface.app import FaceAnalysis
from common import Face
from image import get_image as ins_get_image
from math import ceil
from itertools import product as product
from rknn.api import RKNN
DATASET_PATH = './dataset.txt'
DEFAULT_QUANT = True
def letterbox_resize(image, size, bg_color):
    """
    letterbox_resize the image according to the specified size
    :param image: input image, which can be a NumPy array or file path
    :param size: target size (width, height)
    :param bg_color: background filling data
    :return: processed image
    """
    if isinstance(image, str):
        image = cv2.imread(image)
    target_width, target_height = size
    image_height, image_width, _ = image.shape
    # compute the resized image dimensions
    aspect_ratio = min(target_width / image_width, target_height / image_height)
    new_width = int(image_width * aspect_ratio)
    new_height = int(image_height * aspect_ratio)
    # scale proportionally with cv2.resize()
    image = cv2.resize(image, (new_width, new_height), interpolation=cv2.INTER_AREA)
    # create a new canvas and paste the resized image onto it, centered
    result_image = np.ones((target_height, target_width, 3), dtype=np.uint8) * bg_color
    offset_x = (target_width - new_width) // 2
    offset_y = (target_height - new_height) // 2
    result_image[offset_y:offset_y + new_height, offset_x:offset_x + new_width] = image
    return result_image, aspect_ratio, offset_x, offset_y
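# Example (illustrative values): letterbox a frame to the 640x640 model size,
# then map a model-space coordinate back to the original image:
#   boxed, ratio, dx, dy = letterbox_resize('./test.jpg', (640, 640), 114)
#   x_orig = (x_model - dx) / ratio
#   y_orig = (y_model - dy) / ratio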
def PriorBox(image_size):  # image_size supports (320, 320) and (640, 640)
    anchors = []
    min_sizes = [[16, 32], [64, 128], [256, 512]]
    steps = [8, 16, 32]
    feature_maps = [[ceil(image_size[0] / step), ceil(image_size[1] / step)] for step in steps]
    for k, f in enumerate(feature_maps):
        min_sizes_ = min_sizes[k]
        for i, j in product(range(f[0]), range(f[1])):
            for min_size in min_sizes_:
                s_kx = min_size / image_size[1]
                s_ky = min_size / image_size[0]
                dense_cx = [x * steps[k] / image_size[1] for x in [j + 0.5]]
                dense_cy = [y * steps[k] / image_size[0] for y in [i + 0.5]]
                for cy, cx in product(dense_cy, dense_cx):
                    anchors += [cx, cy, s_kx, s_ky]
    output = np.array(anchors).reshape(-1, 4)
    print("image_size:", image_size, " num_priors=", output.shape[0])
    return output
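# For a 640x640 input this yields (80*80 + 40*40 + 20*20) * 2 = 16800 priors,
# i.e. PriorBox((640, 640)).shape == (16800, 4).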
def box_decode(loc, priors):
    """Decode locations from predictions using priors to undo
    the encoding we did for offset regression at train time.
    Args:
        loc (tensor): location predictions for loc layers,
            Shape: [num_priors, 4]
        priors (tensor): Prior boxes in center-offset form.
            Shape: [num_priors, 4].
        variances: (list) Variances of priorboxes
    Return:
        decoded bounding box predictions
    """
    variances = [0.1, 0.2]
    boxes = np.concatenate((
        priors[:, :2] + loc[:, :2] * variances[0] * priors[:, 2:],
        priors[:, 2:] * np.exp(loc[:, 2:] * variances[1])), axis=1)
    boxes[:, :2] -= boxes[:, 2:] / 2
    boxes[:, 2:] += boxes[:, :2]
    return boxes
def decode_landm(pre, priors):
    """Decode landm from predictions using priors to undo
    the encoding we did for offset regression at train time.
    Args:
        pre (tensor): landm predictions for loc layers,
            Shape: [num_priors, 10]
        priors (tensor): Prior boxes in center-offset form.
            Shape: [num_priors, 4].
        variances: (list) Variances of priorboxes
    Return:
        decoded landm predictions
    """
    variances = [0.1, 0.2]
    landmarks = np.concatenate((
        priors[:, :2] + pre[:, :2] * variances[0] * priors[:, 2:],
        priors[:, :2] + pre[:, 2:4] * variances[0] * priors[:, 2:],
        priors[:, :2] + pre[:, 4:6] * variances[0] * priors[:, 2:],
        priors[:, :2] + pre[:, 6:8] * variances[0] * priors[:, 2:],
        priors[:, :2] + pre[:, 8:10] * variances[0] * priors[:, 2:]
    ), axis=1)
    return landmarks
def nms(dets, thresh):
    """Pure Python NMS baseline."""
    x1 = dets[:, 0]
    y1 = dets[:, 1]
    x2 = dets[:, 2]
    y2 = dets[:, 3]
    scores = dets[:, 4]
    areas = (x2 - x1 + 1) * (y2 - y1 + 1)
    order = scores.argsort()[::-1]
    keep = []
    while order.size > 0:
        i = order[0]
        keep.append(i)
        xx1 = np.maximum(x1[i], x1[order[1:]])
        yy1 = np.maximum(y1[i], y1[order[1:]])
        xx2 = np.minimum(x2[i], x2[order[1:]])
        yy2 = np.minimum(y2[i], y2[order[1:]])
        w = np.maximum(0.0, xx2 - xx1 + 1)
        h = np.maximum(0.0, yy2 - yy1 + 1)
        inter = w * h
        ovr = inter / (areas[i] + areas[order[1:]] - inter)
        inds = np.where(ovr <= thresh)[0]
        order = order[inds + 1]
    return keep
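# Usage (illustrative): dets is an (N, 5) array of [x1, y1, x2, y2, score] rows,
# already sorted by descending score; nms(dets, 0.4) returns the indices of the
# boxes that survive suppression at IoU threshold 0.4.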
def distance2bbox(points, distance, max_shape=None):
    """Decode distance prediction to bounding box.
    Args:
        points (Tensor): Shape (n, 2), [x, y].
        distance (Tensor): Distance from the given point to 4
            boundaries (left, top, right, bottom).
        max_shape (tuple): Shape of the image.
    Returns:
        Tensor: Decoded bboxes.
    """
    x1 = points[:, 0] - distance[:, 0]
    y1 = points[:, 1] - distance[:, 1]
    x2 = points[:, 0] + distance[:, 2]
    y2 = points[:, 1] + distance[:, 3]
    if max_shape is not None:
        x1 = x1.clamp(min=0, max=max_shape[1])
        y1 = y1.clamp(min=0, max=max_shape[0])
        x2 = x2.clamp(min=0, max=max_shape[1])
        y2 = y2.clamp(min=0, max=max_shape[0])
    return np.stack([x1, y1, x2, y2], axis=-1)
def distance2kps(points, distance, max_shape=None):
    """Decode distance predictions to keypoints.
    Args:
        points (Tensor): Shape (n, 2), [x, y].
        distance (Tensor): Distance from the given point to each
            keypoint, interleaved as (dx, dy) pairs.
        max_shape (tuple): Shape of the image.
    Returns:
        Tensor: Decoded keypoints.
    """
    preds = []
    for i in range(0, distance.shape[1], 2):
        px = points[:, i % 2] + distance[:, i]
        py = points[:, i % 2 + 1] + distance[:, i + 1]
        if max_shape is not None:
            px = px.clamp(min=0, max=max_shape[1])
            py = py.clamp(min=0, max=max_shape[0])
        preds.append(px)
        preds.append(py)
    return np.stack(preds, axis=-1)
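# Worked example for distance2bbox: an anchor center at (160, 160) with
# distances [10, 20, 30, 40] decodes to the box (150, 140, 190, 200).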
def draw_on(img, faces):
    import cv2
    dimg = img.copy()
    for i in range(len(faces)):
        face = faces[i]
        box = face.bbox.astype(int)
        color = (0, 0, 255)
        cv2.rectangle(dimg, (box[0], box[1]), (box[2], box[3]), color, 2)
        if face.kps is not None:
            kps = face.kps.astype(int)
            #print(landmark.shape)
            for l in range(kps.shape[0]):
                color = (0, 0, 255)
                if l == 0 or l == 3:
                    color = (0, 255, 0)
                cv2.circle(dimg, (kps[l][0], kps[l][1]), 1, color, 2)
        if face.gender is not None and face.age is not None:
            cv2.putText(dimg, '%s,%d' % (face.sex, face.age), (box[0] - 1, box[1] - 4),
                        cv2.FONT_HERSHEY_COMPLEX, 0.7, (0, 255, 0), 1)
        #for key, value in face.items():
        #    if key.startswith('landmark_3d'):
        #        print(key, value.shape)
        #        lmk = np.round(value).astype(int)
        #        for l in range(lmk.shape[0]):
        #            cv2.circle(dimg, (lmk[l][0], lmk[l][1]), 1, (255, 0, 0), 2)
    return dimg
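# draw_on takes insightface Face objects (bbox, kps, optional gender/age) and
# returns a copy of the image with boxes and keypoints drawn on it.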
if __name__ == '__main__':
    # Create the RKNN object
    rknn = RKNN()
    # Preprocessing config
    print('--> Config model')
    # NOTE: the bracketed values below were lost in the original post and have been
    # reconstructed; mean/std follow the insightface detector (mean 127.5, std 128),
    # and the input shape matches det_10g's 1x3x640x640 ONNX input.
    '''
    rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[128, 128, 128]], target_platform="rv1106b",
                quantized_algorithm="normal", dynamic_input=[[[1, 3, 640, 640]]], quant_img_RGB2BGR=True,
                remove_reshape=True, remove_weight=True, model_pruning=True)  # mmse
    '''
    rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[128, 128, 128]], target_platform="rv1106b",
                quantized_algorithm="normal", dynamic_input=[[[1, 3, 640, 640]]],
                quant_img_RGB2BGR=False, remove_reshape=False, remove_weight=False, model_pruning=True)  # mmse
    print('done')
    # Load the model
    print('--> Loading model')
    ret = rknn.load_onnx(model="./det_10g.onnx")  #, input_size_list=[[1, 3, 640, 640]])
    if ret != 0:
        print('Load model failed!')
        exit(ret)
    print('done')
    # Build the model
    print('--> Building model')
    ret = rknn.build(do_quantization=True, dataset=DATASET_PATH)  #, rknn_batch_size=1)
    if ret != 0:
        print('Build model failed!')
        exit(ret)
    print('done')
    # Input image
    '''
    # Alternative 1: letterbox preprocessing (centered padding)
    img = cv2.imread('./test.jpg')
    img_height, img_width, _ = img.shape
    model_height, model_width = (640, 640)
    letterbox_img, aspect_ratio, offset_x, offset_y = letterbox_resize(img, (model_height, model_width), 114)  # letterbox scaling
    infer_img = letterbox_img[..., ::-1]  # BGR2RGB
    infer_img = np.expand_dims(infer_img, 0)
    print(infer_img.shape)
    '''
    '''
    # Alternative 2: plain resize (distorts the aspect ratio)
    img = cv2.imread('./test.jpg')
    #img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
    img = cv2.resize(img, (640, 640))
    infer_img = np.expand_dims(img, 0)
    '''
    # Active path: insightface-style scaling with top-left padding
    img = cv2.imread('./test.jpg')
    input_size = (640, 640)
    im_ratio = float(img.shape[0]) / img.shape[1]
    model_ratio = float(input_size[1]) / input_size[0]
    if im_ratio > model_ratio:
        new_height = input_size[1]
        new_width = int(new_height / im_ratio)
    else:
        new_width = input_size[0]
        new_height = int(new_width * im_ratio)
    det_scale = float(new_height) / img.shape[0]
    print(new_width, new_height)
    resized_img = cv2.resize(img, (new_width, new_height))
    det_img = np.zeros((input_size[1], input_size[0], 3), dtype=np.uint8)
    det_img[:new_height, :new_width, :] = resized_img
    infer_img = np.expand_dims(det_img, 0)
    # Init runtime environment
    print('--> Init runtime environment')
    ret = rknn.init_runtime()
    if ret != 0:
        print('Init runtime environment failed!')
        exit(ret)
    print('done')
    # Run
    print('--> Running model')
    '''
    outputs = rknn.inference(inputs=[infer_img], data_format=['nhwc'])
    np.save('./onnx_resnet50v2_0.npy', outputs[0])
    x = outputs[0]
    output = np.exp(x) / np.sum(np.exp(x))
    outputs = [output]
    show_outputs(outputs)
    print('done')
    '''
    outputs = rknn.inference(inputs=[infer_img])  #, data_format=['nhwc'])
    #print(outputs)
    scores_list = []
    bboxes_list = []
    kpss_list = []
    print("forward-------------------")
    # outputs come in order: per-stride scores, then box distances, then keypoint distances
    input_height = 640
    input_width = 640
    fmc = 3
    threshold = 0.5
    feat_stride_fpn = [8, 16, 32]
    num_anchors = 2
    center_cache = {}  # moved out of the loop so the cache is actually reused
    for idx, stride in enumerate(feat_stride_fpn):
        scores = outputs[idx]
        bbox_preds = outputs[idx + fmc]
        bbox_preds = bbox_preds * stride
        kps_preds = outputs[idx + fmc * 2] * stride
        height = input_height // stride
        width = input_width // stride
        K = height * width
        key = (height, width, stride)
        if key in center_cache:
            anchor_centers = center_cache[key]
        else:
            #solution-1, c style:
            #anchor_centers = np.zeros((height, width, 2), dtype=np.float32)
            #for i in range(height):
            #    anchor_centers[i, :, 1] = i
            #for i in range(width):
            #    anchor_centers[:, i, 0] = i
            #solution-2:
            #xv, yv = np.meshgrid(np.arange(width), np.arange(height))
            #anchor_centers = np.stack([xv, yv], axis=-1).astype(np.float32)
            #solution-3:
            anchor_centers = np.stack(np.mgrid[:height, :width][::-1], axis=-1).astype(np.float32)
            #print(anchor_centers.shape)
            anchor_centers = (anchor_centers * stride).reshape((-1, 2))
            if num_anchors > 1:
                anchor_centers = np.stack([anchor_centers] * num_anchors, axis=1).reshape((-1, 2))
            if len(center_cache) < 100:
                center_cache[key] = anchor_centers
        pos_inds = np.where(scores >= threshold)[0]
        print(stride, pos_inds, scores[pos_inds], threshold)
        bboxes = distance2bbox(anchor_centers, bbox_preds)
        pos_scores = scores[pos_inds]
        pos_bboxes = bboxes[pos_inds]
        #print(stride, pos_inds, pos_bboxes)
        scores_list.append(pos_scores)
        bboxes_list.append(pos_bboxes)
        kpss = distance2kps(anchor_centers, kps_preds)
        #kpss = kps_preds
        kpss = kpss.reshape((kpss.shape[0], -1, 2))
        pos_kpss = kpss[pos_inds]
        kpss_list.append(pos_kpss)
    #self.forward
    print("bboxes_list---------------")
    print(bboxes_list)
    '''
    print("scores_list---------------")
    print(scores_list)
    print("bboxes_list---------------")
    print(bboxes_list)
    print("kpss_list-----------------")
    print(kpss_list)
    print("-----------------------")
    '''
    #det_scale = 0.5  # hard-coded override from the original post; the det_scale computed during preprocessing is used instead
    scores = np.vstack(scores_list)
    scores_ravel = scores.ravel()
    order = scores_ravel.argsort()[::-1]
    bboxes = np.vstack(bboxes_list) / det_scale
    kpss = np.vstack(kpss_list) / det_scale
    pre_det = np.hstack((bboxes, scores)).astype(np.float32, copy=False)
    pre_det = pre_det[order, :]
    keep = nms(pre_det, 0.4)
    det = pre_det[keep, :]
    kpss = kpss[order, :, :]
    kpss = kpss[keep, :, :]
    max_num = 0
    metric = 'default'
    print(max_num, det.shape)
    if max_num > 0 and det.shape[0] > max_num:
        area = (det[:, 2] - det[:, 0]) * (det[:, 3] - det[:, 1])
        img_center = img.shape[0] // 2, img.shape[1] // 2
        offsets = np.vstack([
            (det[:, 0] + det[:, 2]) / 2 - img_center[1],
            (det[:, 1] + det[:, 3]) / 2 - img_center[0]
        ])
        offset_dist_squared = np.sum(np.power(offsets, 2.0), 0)
        if metric == 'max':
            values = area
        else:
            values = area - offset_dist_squared * 2.0  # some extra weight on the centering
        bindex = np.argsort(values)[::-1]
        bindex = bindex[:max_num]
        det = det[bindex, :]
        if kpss is not None:
            kpss = kpss[bindex, :]
    #self.det_model.detect
    bboxes = det
    print("bboxes-------------------")
    print(bboxes)
    print("kpss-------------------")
    print(kpss)
    '''
    if bboxes.shape[0] == 0:
        return []
    '''
    ret = []
    for i in range(bboxes.shape[0]):
        bbox = bboxes[i, 0:4]
        det_score = bboxes[i, 4]
        kps = None
        if kpss is not None:
            kps = kpss[i]
        face = Face(bbox=bbox, kps=kps, det_score=det_score)
        '''
        for taskname, model in self.models.items():
            if taskname == 'detection':
                continue
            model.get(img, face)
        '''
        #model.get(img, face)
        ret.append(face)
    print("ret---------------")
    print(ret)
    faces = ret
    img = cv2.imread('./test.jpg')
    rimg = draw_on(img, faces)
    cv2.imwrite("./ldh_output1.jpg", rimg)
    '''
    # RetinaFace-style decode path (kept for reference; requires the letterbox
    # preprocessing from Alternative 1 above and a 3-output RetinaFace model)
    loc, conf, landmarks = outputs  # fetch output data
    priors = PriorBox(image_size=(model_height, model_width))  # prior boxes
    boxes = box_decode(loc.squeeze(0), priors)  # decode output data
    # letterbox
    scale = np.array([model_width, model_height,
                      model_width, model_height])
    boxes = boxes * scale // 1  # face box
    boxes[..., 0::2] = np.clip((boxes[..., 0::2] - offset_x) / aspect_ratio, 0, img_width)   # letterbox
    boxes[..., 1::2] = np.clip((boxes[..., 1::2] - offset_y) / aspect_ratio, 0, img_height)  # letterbox
    scores = conf.squeeze(0)[:, 1]  # face detection confidence
    landmarks = decode_landm(landmarks.squeeze(0), priors)  # face keypoint data
    scale_landmarks = np.array([model_width, model_height, model_width, model_height,
                                model_width, model_height, model_width, model_height,
                                model_width, model_height])
    landmarks = landmarks * scale_landmarks // 1
    landmarks[..., 0::2] = np.clip((landmarks[..., 0::2] - offset_x) / aspect_ratio, 0, img_width)   # letterbox
    landmarks[..., 1::2] = np.clip((landmarks[..., 1::2] - offset_y) / aspect_ratio, 0, img_height)  # letterbox
    # drop low-confidence detections
    inds = np.where(scores > 0.5)[0]
    boxes = boxes[inds]
    landmarks = landmarks[inds]
    scores = scores[inds]
    order = scores.argsort()[::-1]
    boxes = boxes[order]
    landmarks = landmarks[order]
    scores = scores[order]
    # non-maximum suppression
    dets = np.hstack((boxes, scores[:, np.newaxis])).astype(
        np.float32, copy=False)
    keep = nms(dets, 0.2)
    dets = dets[keep]
    landmarks = landmarks[keep]
    dets = np.concatenate((dets, landmarks), axis=1)
    # draw boxes
    for data in dets:
        if data[4] < 0.5:
            continue
        #print("face @ (%d %d %d %d) %f" % (data[0], data[1], data[2], data[3], data[4]))
        text = "{:.4f}".format(data[4])
        data = list(map(int, data))
        cv2.rectangle(img, (data[0], data[1]),
                      (data[2], data[3]), (0, 0, 255), 2)
        cx = data[0]
        cy = data[1] + 12
        cv2.putText(img, text, (cx, cy),
                    cv2.FONT_HERSHEY_DUPLEX, 0.5, (255, 255, 255))
        # landmarks
        cv2.circle(img, (data[5], data[6]), 1, (0, 0, 255), 5)
        cv2.circle(img, (data[7], data[8]), 1, (0, 255, 255), 5)
        cv2.circle(img, (data[9], data[10]), 1, (255, 0, 255), 5)
        cv2.circle(img, (data[11], data[12]), 1, (0, 255, 0), 5)
        cv2.circle(img, (data[13], data[14]), 1, (255, 0, 0), 5)
    img_path = './result.jpg'
    cv2.imwrite(img_path, img)
    print("save image in", img_path)
    '''
    # Release
    rknn.release()</code></pre>
<p>With that, face detection with landmark annotation works correctly.</p>
<p>Using the same approach, copy the files from insightface/python-package into the rknn environment and adapt the model initialization and inference in the model_zoo files to the RKNN API; this produces the same results.</p>
<p>I tested the retinaface and arcface models: after modifying the python files for these two models, they can also be used through FaceAnalysis, following the pattern sketched below.</p>
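<p>The adaptation in both files follows the same pattern: keep insightface's pre- and post-processing, but replace the onnxruntime session with an RKNN build in <code>prepare()</code> and an RKNN call in the inference path. A minimal sketch of that pattern, using the same reconstructed config values as above (the class name is illustrative, not insightface API):</p>
<pre>
<code>from rknn.api import RKNN

class RKNNBackend:
    """Illustrative pattern: build once in prepare(), then run inference."""
    def prepare(self, onnx_path, dataset='./dataset.txt'):
        self.rknn = RKNN()
        self.rknn.config(mean_values=[[127.5, 127.5, 127.5]],
                         std_values=[[128, 128, 128]],
                         target_platform='rv1106b')
        assert self.rknn.load_onnx(model=onnx_path) == 0
        assert self.rknn.build(do_quantization=True, dataset=dataset) == 0
        assert self.rknn.init_runtime() == 0

    def forward(self, img):
        # the PC simulator takes NHWC input; normalization is handled by config()
        return self.rknn.inference(inputs=[img[None, ...]])</code></pre>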
<p>The python file for the retinaface model</p>
<pre>
<code># -*- coding: utf-8 -*-
# @Organization: insightface.ai
# @Author  : Jia Guo
# @Time    : 2021-09-18
# @Function:
from __future__ import division
import datetime
import numpy as np
import onnx
import onnxruntime
import os
import os.path as osp
import cv2
import sys
DATASET_PATH = './dataset.txt'
DEFAULT_QUANT = True
def softmax(z):
    assert len(z.shape) == 2
    s = np.max(z, axis=1)
    s = s[:, np.newaxis]  # necessary step to do broadcasting
    e_x = np.exp(z - s)
    div = np.sum(e_x, axis=1)
    div = div[:, np.newaxis]  # ditto
    return e_x / div
def distance2bbox(points, distance, max_shape=None):
    """Decode distance prediction to bounding box.
    Args:
        points (Tensor): Shape (n, 2), [x, y].
        distance (Tensor): Distance from the given point to 4
            boundaries (left, top, right, bottom).
        max_shape (tuple): Shape of the image.
    Returns:
        Tensor: Decoded bboxes.
    """
    x1 = points[:, 0] - distance[:, 0]
    y1 = points[:, 1] - distance[:, 1]
    x2 = points[:, 0] + distance[:, 2]
    y2 = points[:, 1] + distance[:, 3]
    if max_shape is not None:
        x1 = x1.clamp(min=0, max=max_shape[1])
        y1 = y1.clamp(min=0, max=max_shape[0])
        x2 = x2.clamp(min=0, max=max_shape[1])
        y2 = y2.clamp(min=0, max=max_shape[0])
    return np.stack([x1, y1, x2, y2], axis=-1)
def distance2kps(points, distance, max_shape=None):
    """Decode distance predictions to keypoints.
    Args:
        points (Tensor): Shape (n, 2), [x, y].
        distance (Tensor): Distance from the given point to each
            keypoint, interleaved as (dx, dy) pairs.
        max_shape (tuple): Shape of the image.
    Returns:
        Tensor: Decoded keypoints.
    """
    preds = []
    for i in range(0, distance.shape[1], 2):
        px = points[:, i % 2] + distance[:, i]
        py = points[:, i % 2 + 1] + distance[:, i + 1]
        if max_shape is not None:
            px = px.clamp(min=0, max=max_shape[1])
            py = py.clamp(min=0, max=max_shape[0])
        preds.append(px)
        preds.append(py)
    return np.stack(preds, axis=-1)
class RetinaFace:
    def __init__(self, model_file=None, session=None):
        import onnxruntime
        self.model_file = model_file
        self.session = session
        self.taskname = 'detection'
        if self.session is None:
            assert self.model_file is not None
            assert osp.exists(self.model_file)
            self.session = onnxruntime.InferenceSession(self.model_file, None)
        self.center_cache = {}
        self.nms_thresh = 0.4
        self.det_thresh = 0.5
        self._init_vars()
    def _init_vars(self):
        input_cfg = self.session.get_inputs()[0]
        input_shape = input_cfg.shape
        print(input_shape)
        if isinstance(input_shape[2], str):
            self.input_size = None
        else:
            self.input_size = tuple(input_shape[2:4][::-1])
        #print('image_size:', self.image_size)
        input_name = input_cfg.name
        self.input_shape = input_shape
        outputs = self.session.get_outputs()
        output_names = []
        for o in outputs:
            output_names.append(o.name)
        self.input_name = input_name
        self.output_names = output_names
        self.input_mean = 127.5
        self.input_std = 128.0
        print(self.output_names)
        #assert len(outputs)==10 or len(outputs)==15
        self.use_kps = False
        self._anchor_ratio = 1.0
        self._num_anchors = 1
        if len(outputs) == 6:
            self.fmc = 3
            self._feat_stride_fpn = [8, 16, 32]
            self._num_anchors = 2
        elif len(outputs) == 9:
            self.fmc = 3
            self._feat_stride_fpn = [8, 16, 32]
            self._num_anchors = 2
            self.use_kps = True
        elif len(outputs) == 10:
            self.fmc = 5
            self._feat_stride_fpn = [8, 16, 32, 64, 128]
            self._num_anchors = 1
        elif len(outputs) == 15:
            self.fmc = 5
            self._feat_stride_fpn = [8, 16, 32, 64, 128]
            self._num_anchors = 1
            self.use_kps = True
    def prepare(self, ctx_id, **kwargs):
        if ctx_id < 0:
            self.session.set_providers(['CPUExecutionProvider'])
        nms_thresh = kwargs.get('nms_thresh', None)
        if nms_thresh is not None:
            self.nms_thresh = nms_thresh
        det_thresh = kwargs.get('det_thresh', None)
        if det_thresh is not None:
            self.det_thresh = det_thresh
        input_size = kwargs.get('input_size', None)
        if input_size is not None:
            if self.input_size is not None:
                print('warning: det_size is already set in detection model, ignore')
            else:
                self.input_size = input_size
        from rknn.api import RKNN
        # Create the RKNN object
        self.rknn = RKNN()
        # Preprocessing config
        print('--> Config model')
        # NOTE: the bracketed values were lost in the original post; reconstructed as
        # in the standalone script above (insightface mean 127.5 / std 128, 1x3x640x640).
        '''
        rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[128, 128, 128]], target_platform="rv1106b",
                    quantized_algorithm="normal", dynamic_input=[[[1, 3, 640, 640]]], quant_img_RGB2BGR=True,
                    remove_reshape=True, remove_weight=True, model_pruning=True)  # mmse
        '''
        self.rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[128, 128, 128]],
                         target_platform="rv1106b", quantized_algorithm="normal",
                         dynamic_input=[[[1, 3, 640, 640]]], quant_img_RGB2BGR=False,
                         remove_reshape=False, remove_weight=False, model_pruning=True)  # mmse
        print('done')
        # Load the model
        print('--> Loading model')
        ret = self.rknn.load_onnx(model="./det_10g.onnx")
        if ret != 0:
            print('Load model failed!')
            exit(ret)
        print('done')
        # Build the model
        print('--> Building model')
        ret = self.rknn.build(do_quantization=True, dataset=DATASET_PATH)
        if ret != 0:
            print('Build model failed!')
            exit(ret)
        print('done')
        # Init runtime environment
        print('--> Init runtime environment')
        ret = self.rknn.init_runtime()
        if ret != 0:
            print('Init runtime environment failed!')
            exit(ret)
        print('done')
    def forward(self, img, threshold):
        print("forward")
        scores_list = []
        bboxes_list = []
        kpss_list = []
        input_size = tuple(img.shape[0:2][::-1])
        #net_outs = self.rknn.inference(inputs=[img])
        blob = cv2.dnn.blobFromImage(img, 1.0 / self.input_std, input_size,
                                     (self.input_mean, self.input_mean, self.input_mean), swapRB=True)
        #net_outs = self.session.run(self.output_names, {self.input_name: blob})
        infer_img = np.expand_dims(img, 0)
        net_outs = self.rknn.inference(inputs=[infer_img])
        # Release. NOTE: releasing here means prepare() must be called again before
        # the next detection; the test script below re-prepares before the second
        # image for exactly this reason.
        self.rknn.release()
        input_height = blob.shape[2]
        input_width = blob.shape[3]
        fmc = self.fmc
        for idx, stride in enumerate(self._feat_stride_fpn):
            scores = net_outs[idx]
            bbox_preds = net_outs[idx + fmc]
            bbox_preds = bbox_preds * stride
            if self.use_kps:
                kps_preds = net_outs[idx + fmc * 2] * stride
            height = input_height // stride
            width = input_width // stride
            K = height * width
            key = (height, width, stride)
            if key in self.center_cache:
                anchor_centers = self.center_cache[key]
            else:
                #solution-1, c style:
                #anchor_centers = np.zeros((height, width, 2), dtype=np.float32)
                #for i in range(height):
                #    anchor_centers[i, :, 1] = i
                #for i in range(width):
                #    anchor_centers[:, i, 0] = i
                #solution-2:
                #xv, yv = np.meshgrid(np.arange(width), np.arange(height))
                #anchor_centers = np.stack([xv, yv], axis=-1).astype(np.float32)
                #solution-3:
                anchor_centers = np.stack(np.mgrid[:height, :width][::-1], axis=-1).astype(np.float32)
                #print(anchor_centers.shape)
                anchor_centers = (anchor_centers * stride).reshape((-1, 2))
                if self._num_anchors > 1:
                    anchor_centers = np.stack([anchor_centers] * self._num_anchors, axis=1).reshape((-1, 2))
                if len(self.center_cache) < 100:
                    self.center_cache[key] = anchor_centers
            pos_inds = np.where(scores >= threshold)[0]
            bboxes = distance2bbox(anchor_centers, bbox_preds)
            pos_scores = scores[pos_inds]
            pos_bboxes = bboxes[pos_inds]
            scores_list.append(pos_scores)
            bboxes_list.append(pos_bboxes)
            if self.use_kps:
                kpss = distance2kps(anchor_centers, kps_preds)
                #kpss = kps_preds
                kpss = kpss.reshape((kpss.shape[0], -1, 2))
                pos_kpss = kpss[pos_inds]
                kpss_list.append(pos_kpss)
        return scores_list, bboxes_list, kpss_list
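    # For det_10g (9 outputs): net_outs[0:3] are per-stride scores (8/16/32),
    # net_outs[3:6] box distances, net_outs[6:9] keypoint distances — the
    # idx / idx+fmc / idx+fmc*2 indexing above relies on this ordering.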
    def detect(self, img, input_size=None, max_num=0, metric='default'):
        assert input_size is not None or self.input_size is not None
        input_size = self.input_size if input_size is None else input_size
        im_ratio = float(img.shape[0]) / img.shape[1]
        model_ratio = float(input_size[1]) / input_size[0]
        if im_ratio > model_ratio:
            new_height = input_size[1]
            new_width = int(new_height / im_ratio)
        else:
            new_width = input_size[0]
            new_height = int(new_width * im_ratio)
        det_scale = float(new_height) / img.shape[0]
        resized_img = cv2.resize(img, (new_width, new_height))
        det_img = np.zeros((input_size[1], input_size[0], 3), dtype=np.uint8)
        det_img[:new_height, :new_width, :] = resized_img
        scores_list, bboxes_list, kpss_list = self.forward(det_img, self.det_thresh)
        scores = np.vstack(scores_list)
        scores_ravel = scores.ravel()
        order = scores_ravel.argsort()[::-1]
        bboxes = np.vstack(bboxes_list) / det_scale
        if self.use_kps:
            kpss = np.vstack(kpss_list) / det_scale
        pre_det = np.hstack((bboxes, scores)).astype(np.float32, copy=False)
        pre_det = pre_det[order, :]
        keep = self.nms(pre_det)
        det = pre_det[keep, :]
        if self.use_kps:
            kpss = kpss[order, :, :]
            kpss = kpss[keep, :, :]
        else:
            kpss = None
        if max_num > 0 and det.shape[0] > max_num:
            area = (det[:, 2] - det[:, 0]) * (det[:, 3] -
                                              det[:, 1])
            img_center = img.shape[0] // 2, img.shape[1] // 2
            offsets = np.vstack([
                (det[:, 0] + det[:, 2]) / 2 - img_center[1],
                (det[:, 1] + det[:, 3]) / 2 - img_center[0]
            ])
            offset_dist_squared = np.sum(np.power(offsets, 2.0), 0)
            if metric == 'max':
                values = area
            else:
                values = area - offset_dist_squared * 2.0  # some extra weight on the centering
            bindex = np.argsort(
                values)[::-1]  # some extra weight on the centering
            bindex = bindex[:max_num]
            det = det[bindex, :]
            if kpss is not None:
                kpss = kpss[bindex, :]
        return det, kpss
    def nms(self, dets):
        thresh = self.nms_thresh
        x1 = dets[:, 0]
        y1 = dets[:, 1]
        x2 = dets[:, 2]
        y2 = dets[:, 3]
        scores = dets[:, 4]
        areas = (x2 - x1 + 1) * (y2 - y1 + 1)
        order = scores.argsort()[::-1]
        keep = []
        while order.size > 0:
            i = order[0]
            keep.append(i)
            xx1 = np.maximum(x1[i], x1[order[1:]])
            yy1 = np.maximum(y1[i], y1[order[1:]])
            xx2 = np.minimum(x2[i], x2[order[1:]])
            yy2 = np.minimum(y2[i], y2[order[1:]])
            w = np.maximum(0.0, xx2 - xx1 + 1)
            h = np.maximum(0.0, yy2 - yy1 + 1)
            inter = w * h
            ovr = inter / (areas[i] + areas[order[1:]] - inter)
            inds = np.where(ovr <= thresh)[0]
            order = order[inds + 1]
        return keep
def get_retinaface(name, download=False, root='~/.insightface/models', **kwargs):
    print("get---------------------")
    if not download:
        assert os.path.exists(name)
        return RetinaFace(name)
    else:
        from .model_store import get_model_file
        _file = get_model_file("retinaface_%s" % name, root=root)
        return RetinaFace(_file)
</code></pre>
<p>The python file for the arcface model</p>
<pre>
<code># -*- coding: utf-8 -*-
# @Organization: insightface.ai
# @Author : Jia Guo
# @Time : 2021-05-04
# @Function :
from __future__ import division
import numpy as np
import cv2
import onnx
import onnxruntime
from ..utils import face_align
DATASET_PATH = './dataset.txt'
DEFAULT_QUANT = True
__all__ = [
'ArcFaceONNX',
]
class ArcFaceONNX:
    def __init__(self, model_file=None, session=None):
        assert model_file is not None
        self.model_file = model_file
        self.session = session
        self.taskname = 'recognition'
        find_sub = False
        find_mul = False
        model = onnx.load(self.model_file)
        #print(self.model_file)
        graph = model.graph
        for nid, node in enumerate(graph.node[:8]):
            #print(nid, node.name)
            if node.name.startswith('Sub') or node.name.startswith('_minus'):
                find_sub = True
            if node.name.startswith('Mul') or node.name.startswith('_mul'):
                find_mul = True
        if find_sub and find_mul:
            #mxnet arcface model
            input_mean = 0.0
            input_std = 1.0
        else:
            input_mean = 127.5
            input_std = 127.5
        self.input_mean = input_mean
        self.input_std = input_std
        #print('input mean and std:', self.input_mean, self.input_std)
        if self.session is None:
            self.session = onnxruntime.InferenceSession(self.model_file, None)
        input_cfg = self.session.get_inputs()[0]
        input_shape = input_cfg.shape
        input_name = input_cfg.name
        self.input_size = tuple(input_shape[2:4][::-1])
        self.input_shape = input_shape
        outputs = self.session.get_outputs()
        output_names = []
        for out in outputs:
            output_names.append(out.name)
        self.input_name = input_name
        self.output_names = output_names
        assert len(self.output_names) == 1
        self.output_shape = outputs[0].shape
    def prepare(self, ctx_id, **kwargs):
        if ctx_id < 0:
            self.session.set_providers(['CPUExecutionProvider'])
        from rknn.api import RKNN
        # Create the RKNN object
        self.rknn = RKNN()
        # Preprocessing config
        print('--> Config model')
        # NOTE: reconstructed values; w600k_r50 expects a 1x3x112x112 input with
        # mean 127.5 / std 127.5 (matching the non-mxnet branch in __init__ above).
        '''
        rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[127.5, 127.5, 127.5]], target_platform="rv1106b",
                    quantized_algorithm="normal", dynamic_input=[[[1, 3, 112, 112]]], quant_img_RGB2BGR=True,
                    remove_reshape=True, remove_weight=True, model_pruning=True)  # mmse
        '''
        self.rknn.config(mean_values=[[127.5, 127.5, 127.5]], std_values=[[127.5, 127.5, 127.5]],
                         target_platform="rv1106b", quantized_algorithm="normal",
                         dynamic_input=[[[1, 3, 112, 112]]], quant_img_RGB2BGR=False,
                         remove_reshape=False, remove_weight=False, model_pruning=True)  # mmse
        print('done')
        # Load the model
        print('--> Loading model')
        ret = self.rknn.load_onnx(model=self.model_file)
        if ret != 0:
            print('Load model failed!')
            exit(ret)
        print('done')
        # Build the model
        print('--> Building model')
        ret = self.rknn.build(do_quantization=True, dataset=DATASET_PATH)
        if ret != 0:
            print('Build model failed!')
            exit(ret)
        print('done')
        # Init runtime environment
        print('--> Init runtime environment')
        ret = self.rknn.init_runtime()
        if ret != 0:
            print('Init runtime environment failed!')
            exit(ret)
        print('done')
    def get(self, img, face):
        aimg = face_align.norm_crop(img, landmark=face.kps, image_size=self.input_size[0])
        #face.embedding = self.get_feat(aimg).flatten()
        face.embedding = self.get_feat(aimg)
        return face.embedding
    def compute_sim(self, feat1, feat2):
        from numpy.linalg import norm
        feat1 = feat1.ravel()
        feat2 = feat2.ravel()
        # cosine similarity: 1.0 for identical embeddings, near 0 for unrelated faces
        sim = np.dot(feat1, feat2) / (norm(feat1) * norm(feat2))
        return sim
    def get_feat(self, imgs):
        '''
        # Original onnxruntime path:
        if not isinstance(imgs, list):
            imgs = [imgs]
        input_size = self.input_size
        blob = cv2.dnn.blobFromImages(imgs, 1.0 / self.input_std, input_size,
                                      (self.input_mean, self.input_mean, self.input_mean), swapRB=True)
        net_out = self.session.run(self.output_names, {self.input_name: blob})[0]
        '''
        infer_img = np.expand_dims(imgs, 0)  # HWC -> NHWC
        net_out = self.rknn.inference(inputs=[infer_img])
        # w600k_r50 returns a single 512-d embedding; flatten it to a 1-D vector
        net_outs = np.array(net_out).flatten()  #.ravel()
        return net_outs
    def forward(self, batch_data):
        #blob = (batch_data - self.input_mean) / self.input_std
        #net_out = self.session.run(self.output_names, {self.input_name: blob})
        net_out = self.rknn.inference(inputs=[batch_data])  # batch_data is already batched NHWC
        return net_out
</code></pre>
<p>The insightface test file under rknn</p>
<pre>
<code>import os
import sys
import urllib
import urllib.request
import time
import numpy as np
import cv2
import insightface
from insightface.app import FaceAnalysis
from insightface.data import get_image as ins_get_image
from math import ceil
from itertools import product as product
#from rknn.api import RKNN
# Run
print('--> Running model')
#outputs = rknn.inference(inputs=[infer_img])  #, data_format=['nhwc'])
app = FaceAnalysis(allowed_modules=['detection'], providers=['CUDAExecutionProvider', 'CPUExecutionProvider'])
print("prepare::::")
app.prepare(ctx_id=0, det_size=(640, 640))
img = ins_get_image('t1')  # no file extension needed; put the image in ./insightface/python-package/insightface/data/images
faces = app.get(img)
print("size of faces:", len(faces))
app.prepare(ctx_id=0, det_size=(640, 640))  # prepare again: forward() released the RKNN context
img1 = ins_get_image('face1')  # no file extension needed; same images directory as above
faces1 = app.get(img1)
print("size of faces1:", len(faces1))
#print("faces::::", faces)
#rimg = app.draw_on(img, faces)
#cv2.imwrite("./output1.jpg", rimg)
handler = insightface.model_zoo.get_model('/home/ubuntu/.insightface/models/buffalo_l/w600k_r50.onnx', providers=['CUDAExecutionProvider', 'CPUExecutionProvider'])
handler.prepare(ctx_id=0)
img = ins_get_image('t1')
feature = handler.get(img, faces[0])
#print("size of feature:", len(feature))
print("feature:", feature)
sim = handler.compute_sim(feature, feature)  # self-similarity, should print 1.0
print("sim:", sim)
img1 = ins_get_image('face1')
feature1 = handler.get(img1, faces1[0])
for i in range(len(faces)):
    feature = handler.get(img, faces[i])
    sim = handler.compute_sim(feature, feature1)
    print("sim:", i, sim)
</code></pre>
<p>Unzip it to /rknn-toolkit2/luckfox_rknn/scripts/luckfox_onnx_to_rknn/sim, set up the environment, and you can run inference on the PC.</p>
<p>Hello, a question about this line:</p>
<pre id="code_0">
<code>from image import get_image as ins_get_image</code></pre>
<p>Where does the <code>image</code> module come from?</p>
tzq4 posted on 2025-1-18 00:55:
Hello, a question about this line:
from image import get_image as ins_get_image — where does the image module come from?
<ul>
<li>from insightface.data import get_image as ins_get_image</li>
</ul>
tzq4 posted on 2025-1-18 00:55:
Hello, a question about this line:
from image import get_image as ins_get_image — where does the image module come from?
<p>It is one of the python files from the insightface package</p>