weixin_54532612 2022-03-14 08:42 采纳率: 50%

已结题

mtcnn和facenet实现部分遮挡下的人脸识别

问题遇到的现象和发生背景

问题相关代码，请勿粘贴截图

运行结果及报错内容

我的解答思路和尝试过的方法

我想要达到的结果

对于这些代码我还不太清楚，希望可以帮我用中文详细注释一下代码，谢谢。
``

from facenet import MTCNN, InceptionResnetV1
from torchvision.transforms import functional as F
import numpy as np
import matplotlib.pyplot as plt
import cv2
from PIL import Image
from scipy.spatial.distance import canberra
from sklearn.preprocessing import Normalizer
import torch
import tkinter as tk
from tkinter.filedialog import askopenfilename
from PIL import Image, ImageTk

# Maximum (width, height) in pixels of the image shown in the GUI; read by Resize.
max_w_h = (700, 500)

def ShowImg(img, img_labels):
    """Show an OpenCV BGR image on a Tkinter widget.

    Args:
        img: Image array in BGR channel order (it is converted with
            ``cv2.COLOR_BGR2RGBA`` before display).
        img_labels: Tk widget whose ``image`` option is set to the picture.
    """
    photo = ImageTk.PhotoImage(
        Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGBA))
    )
    img_labels.config(image=photo)
    # Store the PhotoImage on the widget so a reference to it stays alive
    # after this function returns.
    img_labels.image = photo

def Resize(img):
    """Scale an image to fit inside ``max_w_h`` while keeping its aspect ratio.

    Args:
        img: Image array whose shape is ``(height, width, channels)``.

    Returns:
        The image resized by ``cv2.resize`` so that it fills either the
        maximum width or the maximum height, whichever is reached first.
    """
    height, width, _channels = img.shape
    aspect = height / width
    limit_w, limit_h = max_w_h
    if limit_w * aspect > limit_h:
        # Filling the full width would overflow the height: pin the height.
        target_size = (int(limit_h / aspect), int(limit_h))
    else:
        # Otherwise pin the width and derive the height from it.
        target_size = (int(limit_w), int(limit_w * aspect))
    return cv2.resize(img, target_size)

# Set to True to run on the first CUDA device when one is available;
# with False the script always runs on the CPU.
gpu = False
# Logical ``and`` (not bitwise ``&``): the flag gates the CUDA availability check.
device = torch.device('cuda:0' if gpu and torch.cuda.is_available() else 'cpu')
print('Running on device: {}'.format(device))

# Load the FaceNet model (pretrained 'vggface2' weights) in evaluation mode.
facerec = InceptionResnetV1(pretrained='vggface2').eval().to(device)

# Load the MTCNN model used to locate and crop the face.
mtcnn = MTCNN(margin=30, device=device)
l2_encoder = Normalizer(norm='l2')

# Load the stored face data: array 'a' is passed to calculate_distance as the
# known embeddings and array 'b' as their labels.
data = np.load('data.npz')
trainx_embed, trainy = data['a'], data['b']

def calculate_distance(embedding, known_faces, known_labels):
    """Find the known label whose faces are closest to ``embedding``.

    For every distinct label, the Canberra distances between ``embedding``
    and each known face carrying that label are averaged; the label with the
    smallest average is returned.

    Args:
        embedding: Query embedding. It is flattened to 1-D before comparison,
            so a leading batch axis of size one (shape ``(1, d)``) is accepted.
        known_faces: Array of reference embeddings, one per row.
        known_labels: Labels aligned with ``known_faces`` (``known_labels[i]``
            belongs to ``known_faces[i]``).

    Returns:
        A ``(distance, label)`` tuple with the smallest per-label mean
        distance and the label it belongs to. On ties the label that appears
        first in ``known_labels`` wins.

    Raises:
        ValueError: If there is no known face to compare against.
    """
    # canberra() works on 1-D vectors; the caller passes a (1, d) batch.
    query = np.ravel(embedding)

    distances_by_label = {}
    for face, label in zip(known_faces, known_labels):
        distances_by_label.setdefault(label, []).append(
            canberra(query, np.ravel(face))
        )
    if not distances_by_label:
        raise ValueError('no known faces to compare against')

    mean_by_label = {
        label: sum(distances) / len(distances)
        for label, distances in distances_by_label.items()
    }
    best_label = min(mean_by_label, key=mean_by_label.get)
    return (mean_by_label[best_label], best_label)

def run(imgp):
    """Recognise the face in an image file and display the annotated image.

    The face is located and cropped with ``mtcnn``, embedded with ``facerec``
    and matched against ``trainx_embed``/``trainy`` through
    ``calculate_distance``. The image is then re-read with OpenCV, drawn with
    the bounding box and the label, and shown on the module-level ``img_l``
    label.

    Failures are reported on stdout instead of being raised, so a bad file
    does not break the GUI callback.

    Args:
        imgp: Path of the image file to process.
    """
    try:
        # Close the file handle once the cropped face has been copied out.
        with Image.open(imgp) as img:
            _, img_cropped, box = mtcnn(img)
            face_array = np.array(img_cropped)
        face_pixels = F.to_tensor(np.float32(face_array))
        # Centre and scale the pixel values (presumably 0..255 -> about -1..1;
        # TODO confirm against what this MTCNN returns).
        face_pixels = (face_pixels - 127.5) / 128.0
        # Inference only: no gradients are needed.
        with torch.no_grad():
            feas = facerec(face_pixels.unsqueeze(0).to(device))
        feas = feas.cpu().detach().numpy()
        distance, label = calculate_distance(feas, trainx_embed, trainy)
        print(label)

        # plot
        image = cv2.imread(imgp)
        if image is None:
            # cv2.imread signals an unreadable file by returning None.
            raise ValueError('OpenCV could not read {!r}'.format(imgp))
        # Mean distances above this cut-off are reported as an unknown face
        # (368 looks like a previously tried value — TODO confirm).
        if distance > 350:  # 368
            label = "UNKNOWN"
        p1, p2 = (int(box[0]), int(box[1])), (int(box[2]), int(box[3]))
        # Line thickness grows with the image size, with a minimum of 2.
        thickness = max(round(sum(image.shape) / 2 * 0.003), 2)
        cv2.rectangle(image, p1, p2, (0, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
        tf = max(thickness - 1, 1)  # font thickness
        _, h = cv2.getTextSize(label, 0, fontScale=thickness / 3, thickness=tf)[0]  # text height
        outside = p1[1] - h - 3 >= 0  # label fits outside box
        cv2.putText(image, label, (p1[0], p1[1] - 2 if outside else p1[1] + h + 2), 0, thickness / 3, (0, 255, 255),
                    thickness=tf, lineType=cv2.LINE_AA)
        data_img = Resize(image)
        ShowImg(data_img, img_l)
        img_l.update()
    except Exception as exc:
        # Keep the best-effort behaviour, but say what actually went wrong
        # and let KeyboardInterrupt/SystemExit propagate.
        print('Can not detect face!')
        print('Reason: {!r}'.format(exc))

def select_img():
    """Ask the user for an image file and run recognition on it.

    Does nothing when the file dialog is cancelled. Any error escaping
    ``run`` is printed instead of being silently discarded.
    """
    path = askopenfilename()
    if not path:
        # Dialog was cancelled: there is no file to process.
        return
    try:
        run(path)
    except Exception as exc:
        print('Failed to process {!r}: {!r}'.format(path, exc))

if __name__ == '__main__':
    # Script entry point: build the Tk window and start the event loop.
    root = tk.Tk()
    root.title("Face Detection Demo")
    sc_width = root.winfo_screenwidth()
    sc_height = root.winfo_screenheight()
    WID = 600  # window width
    HEI = 600  # window height
    # Centre the window horizontally and place it 30 px above the vertical centre.
    root.geometry('%dx%d+%d+%d' % (WID, HEI, (sc_width - WID) / 2, (sc_height - HEI) / 2 - 30))
    # Font shared by both buttons (named so it does not shadow the builtin ``type``).
    button_font = ('宋体', "12", 'normal')

    # Top row: "load image" and "quit" buttons.
    up_frame = tk.Frame(root)
    tk.Button(up_frame, text='加载图片', command=select_img, font=button_font).pack(padx=1, side=tk.LEFT)
    tk.Button(up_frame, text='退出系统', command=root.destroy, font=button_font).pack(padx=1, side=tk.LEFT)
    up_frame.pack(pady=1, anchor='n')

    # Label that displays the annotated image; run() reads it as a global.
    img_frame = tk.Frame(root)
    img_l = tk.Label(img_frame)
    img_l.pack()
    img_frame.pack(pady=20)
    root.mainloop()

展开全部

写回答
好问题 0 提建议
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

2条回答默认最新

CSDN专家-深度学习进阶 2022-03-15 01:05

关注

对应代码块后面#写了注释

from facenet import MTCNN, InceptionResnetV1             #导入各种需要用到的包
from torchvision.transforms import functional as F
import numpy as np
import matplotlib.pyplot as plt
import cv2
from PIL import Image
from scipy.spatial.distance import canberra
from sklearn.preprocessing import Normalizer
import torch
import tkinter as tk
from tkinter.filedialog import askopenfilename
from PIL import Image, ImageTk
 
# Maximum (width, height) in pixels of the image shown in the GUI; read by Resize.
max_w_h = (700, 500)
 
def ShowImg(img, img_labels):
    """Show an OpenCV BGR image on a Tkinter widget.

    Args:
        img: Image array in BGR channel order (it is converted with
            ``cv2.COLOR_BGR2RGBA`` before display).
        img_labels: Tk widget whose ``image`` option is set to the picture.
    """
    photo = ImageTk.PhotoImage(
        Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGBA))
    )
    img_labels.config(image=photo)
    # Store the PhotoImage on the widget so a reference to it stays alive
    # after this function returns.
    img_labels.image = photo
 
def Resize(img):
    """Scale an image to fit inside ``max_w_h`` while keeping its aspect ratio.

    Args:
        img: Image array whose shape is ``(height, width, channels)``.

    Returns:
        The image resized by ``cv2.resize`` so that it fills either the
        maximum width or the maximum height, whichever is reached first.
    """
    height, width, _channels = img.shape
    aspect = height / width
    limit_w, limit_h = max_w_h
    if limit_w * aspect > limit_h:
        # Filling the full width would overflow the height: pin the height.
        target_size = (int(limit_h / aspect), int(limit_h))
    else:
        # Otherwise pin the width and derive the height from it.
        target_size = (int(limit_w), int(limit_w * aspect))
    return cv2.resize(img, target_size)
 
# Set to True to run on the first CUDA device when one is available;
# with False the script always runs on the CPU.
gpu = False
# Logical ``and`` (not bitwise ``&``): the flag gates the CUDA availability check.
device = torch.device('cuda:0' if gpu and torch.cuda.is_available() else 'cpu')
print('Running on device: {}'.format(device))

# Load the FaceNet model (pretrained 'vggface2' weights) in evaluation mode.
facerec = InceptionResnetV1(pretrained='vggface2').eval().to(device)

# Load the MTCNN model used to locate and crop the face.
mtcnn = MTCNN(margin=30, device=device)
l2_encoder = Normalizer(norm='l2')

# Load the stored face data: array 'a' is passed to calculate_distance as the
# known embeddings and array 'b' as their labels.
data = np.load('data.npz')
trainx_embed, trainy = data['a'], data['b']
 
def calculate_distance(embedding, known_faces, known_labels):
    """Find the known label whose faces are closest to ``embedding``.

    For every distinct label, the Canberra distances between ``embedding``
    and each known face carrying that label are averaged; the label with the
    smallest average is returned.

    Args:
        embedding: Query embedding. It is flattened to 1-D before comparison,
            so a leading batch axis of size one (shape ``(1, d)``) is accepted.
        known_faces: Array of reference embeddings, one per row.
        known_labels: Labels aligned with ``known_faces`` (``known_labels[i]``
            belongs to ``known_faces[i]``).

    Returns:
        A ``(distance, label)`` tuple with the smallest per-label mean
        distance and the label it belongs to. On ties the label that appears
        first in ``known_labels`` wins.

    Raises:
        ValueError: If there is no known face to compare against.
    """
    # canberra() works on 1-D vectors; the caller passes a (1, d) batch.
    query = np.ravel(embedding)

    distances_by_label = {}
    for face, label in zip(known_faces, known_labels):
        distances_by_label.setdefault(label, []).append(
            canberra(query, np.ravel(face))
        )
    if not distances_by_label:
        raise ValueError('no known faces to compare against')

    mean_by_label = {
        label: sum(distances) / len(distances)
        for label, distances in distances_by_label.items()
    }
    best_label = min(mean_by_label, key=mean_by_label.get)
    return (mean_by_label[best_label], best_label)
 
def run(imgp):
    """Recognise the face in an image file and display the annotated image.

    The face is located and cropped with ``mtcnn``, embedded with ``facerec``
    and matched against ``trainx_embed``/``trainy`` through
    ``calculate_distance``. The image is then re-read with OpenCV, drawn with
    the bounding box and the label, and shown on the module-level ``img_l``
    label.

    Failures are reported on stdout instead of being raised, so a bad file
    does not break the GUI callback.

    Args:
        imgp: Path of the image file to process.
    """
    try:
        # Close the file handle once the cropped face has been copied out.
        with Image.open(imgp) as img:
            _, img_cropped, box = mtcnn(img)
            face_array = np.array(img_cropped)
        face_pixels = F.to_tensor(np.float32(face_array))
        # Centre and scale the pixel values (presumably 0..255 -> about -1..1;
        # TODO confirm against what this MTCNN returns).
        face_pixels = (face_pixels - 127.5) / 128.0
        # Inference only: no gradients are needed.
        with torch.no_grad():
            feas = facerec(face_pixels.unsqueeze(0).to(device))
        feas = feas.cpu().detach().numpy()
        distance, label = calculate_distance(feas, trainx_embed, trainy)
        print(label)

        # plot
        image = cv2.imread(imgp)
        if image is None:
            # cv2.imread signals an unreadable file by returning None.
            raise ValueError('OpenCV could not read {!r}'.format(imgp))
        # Mean distances above this cut-off are reported as an unknown face
        # (368 looks like a previously tried value — TODO confirm).
        if distance > 350:  # 368
            label = "UNKNOWN"
        p1, p2 = (int(box[0]), int(box[1])), (int(box[2]), int(box[3]))
        # Line thickness grows with the image size, with a minimum of 2.
        thickness = max(round(sum(image.shape) / 2 * 0.003), 2)
        cv2.rectangle(image, p1, p2, (0, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
        tf = max(thickness - 1, 1)  # font thickness
        _, h = cv2.getTextSize(label, 0, fontScale=thickness / 3, thickness=tf)[0]  # text height
        outside = p1[1] - h - 3 >= 0  # label fits outside box
        cv2.putText(image, label, (p1[0], p1[1] - 2 if outside else p1[1] + h + 2), 0, thickness / 3, (0, 255, 255),
                    thickness=tf, lineType=cv2.LINE_AA)
        data_img = Resize(image)
        ShowImg(data_img, img_l)
        img_l.update()
    except Exception as exc:
        # Keep the best-effort behaviour, but say what actually went wrong
        # and let KeyboardInterrupt/SystemExit propagate.
        print('Can not detect face!')
        print('Reason: {!r}'.format(exc))
 
def select_img():
    """Ask the user for an image file and run recognition on it.

    Does nothing when the file dialog is cancelled. Any error escaping
    ``run`` is printed instead of being silently discarded.
    """
    path = askopenfilename()
    if not path:
        # Dialog was cancelled: there is no file to process.
        return
    try:
        run(path)
    except Exception as exc:
        print('Failed to process {!r}: {!r}'.format(path, exc))
 
if __name__ == '__main__':
    # Script entry point: build the Tk window and start the event loop.
    root = tk.Tk()  # create the Tk root window
    root.title("Face Detection Demo")  # window title
    sc_width = root.winfo_screenwidth()  # screen width
    sc_height = root.winfo_screenheight()  # screen height
    WID = 600  # window width
    HEI = 600  # window height
    # Centre the window horizontally and place it 30 px above the vertical centre.
    root.geometry('%dx%d+%d+%d' % (WID, HEI, (sc_width - WID) / 2, (sc_height - HEI) / 2 - 30))
    # Font shared by both buttons (named so it does not shadow the builtin ``type``).
    button_font = ('宋体', "12", 'normal')

    # Top row: "load image" and "quit" buttons.
    up_frame = tk.Frame(root)
    tk.Button(up_frame, text='加载图片', command=select_img, font=button_font).pack(padx=1, side=tk.LEFT)
    tk.Button(up_frame, text='退出系统', command=root.destroy, font=button_font).pack(padx=1, side=tk.LEFT)
    up_frame.pack(pady=1, anchor='n')

    # Label that displays the annotated image; run() reads it as a global.
    img_frame = tk.Frame(root)
    img_l = tk.Label(img_frame)
    img_l.pack()
    img_frame.pack(pady=20)
    root.mainloop()

展开全部

本回答被题主选为最佳回答 , 对您是否有帮助呢? 本回答被专家选为最佳回答 , 对您是否有帮助呢? 本回答被题主和专家选为最佳回答 , 对您是否有帮助呢?

CSDN专家-深度学习进阶 2022-03-15 01:05

如有帮助，请点击我评论上方【采纳该答案】按钮支持一下，谢谢！

CSDN专家-深度学习进阶回复 weixin_54532612 2022-03-15 01:30

这里好像只是单纯计算，没看到具体的阈值

CSDN专家-深度学习进阶回复 weixin_54532612 2022-03-15 06:29

建议你先从出处看看作者的介绍和相关的知识

展开全部4条评论

查看更多回答(1条)

编辑

预览

报告相同问题？

关注问题

基于MTCNN和FaceNet的实时人脸检测识别系统
2022-08-07 06:06

HarmoniaLeo的博客 MTCNN是强大的人脸特征提取器，我们采用MTCNN提取图像的特征，并利用FaceNet将图像特征映射到128维特征空间，随后在特征空间中比较人脸的相似性，进行人脸检测与识别。
利用MTCNN和facenet实现人脸检测和人脸识别
2019-05-14 03:16

老三是只猫的博客利用MTCNN和facenet实现人脸检测和人脸识别 人脸检测和人脸识别技术算是目前人工智能方面应用最成熟的技术了。本博客将利用mtcnn和faceNet搭建一个实现人脸检测和人脸识别的系统。基本思路也很简单，...
facenet mtcnn人脸口罩识别python编写
2023-01-03 07:52

"facenet mtcnn人脸口罩识别python编写"是一个利用Python编程语言实现的人脸识别系统，特别关注于判断人脸是否佩戴口罩。在这个项目中，主要涉及了两个关键的技术：Facenet和MTCNN。 Facenet是一种基于深度学习的...
基于Facenet和MTCNN的人脸识别系统（UI，python）
2024-05-09 09:01

xj30的博客毕业设计，课程设计，人脸识别，口罩识别
基于mtcnn+facenet+svm实现人脸识别系统GUI界面附完整代码数据集
2023-02-04 08:20

计算机毕设论文的博客基于mtcnn+facenet+svm实现人脸识别系统GUI界面附完整代码数据集
课程设计：Python基于MTCNN, iResNet50, Arcface的人脸识别与标注.zip
2022-07-08 06:34

在本课程设计中，我们将深入探讨使用Python进行人脸识别与标注的技术，主要涉及MTCNN（Multi-Task Cascaded Convolutional Networks）、iResNet50和Arcface算法。这些技术在计算机视觉领域，特别是人脸检测、识别和...
Python基于OpenCV的CNN人脸识别
2019-07-30 11:54

在本主题中，我们将深入探讨如何使用Python结合OpenCV库...总结起来，Python和OpenCV结合CNN模型提供了一种强大且灵活的方法来实现人脸识别。通过理解并实践这些知识点，开发者可以构建出具有实用价值的人脸识别系统。
(超详细)基于MTCNN+FaceNet实现人脸识别及轻量级网络探索和改进(附数据集及预训练模型)
2020-07-05 03:00

zhulu_20的博客首先会进行FaceNet原理介绍一、原理分析你好！这是你第一次使用 Markdown编辑器所展示的欢迎页。如果你想学习如何使用Markdown编辑器, 可以仔细阅读这篇文章，了解一下Markdown的基本语法知识。新的改变我们对...
基于facenet_pytorch实现人脸识别
2022-09-09 12:52

MrJson-架构师的博客介绍 facenet-pytorch库里面包含了两个重要功能：人脸检测和人脸识别，其中人脸检测部分使用mtcnn算法，人脸识别部分使用Facenet算法。利用这个库，可以轻松实现人脸检测和人脸向量映射操作。依赖安装 pip install ...
FaceNet+RetinaFace人脸识别管理系统【毕业设计、课程设计】
2023-03-15 14:58

《基于FaceNet+RetinaFace的人脸识别管理系统详解》 人脸识别技术在当今信息化社会中扮演着重要的角色，广泛应用于安全监控、门禁系统、社交媒体等多个领域。本项目以"FaceNet+RetinaFace人脸识别管理系统"为核心，...
python实现人脸识别代码
2020-09-20 17:51

Python 实现人脸识别是一种常见的计算机视觉任务，它利用机器学习算法，特别是支持向量机(SVM)和级联分类器等，来识别图像中的人脸。在这个案例中，我们使用了OpenCV库，这是一个广泛用于图像处理和计算机视觉的开源...
Python-基于facenet的实时人脸识别系统
2019-08-10 20:46

综上所述，基于facenet的实时人脸识别系统结合了深度学习的力量和Python的易用性，能够有效地处理实时视频流中的人脸识别任务。随着技术的不断发展，未来的人脸识别系统将更加智能化，应用范围也将更加广泛。
人脸检测MTCNN和人脸识别Facenet(附源码)
2018-12-05 02:51

tuuzhang的博客 原文链接：人脸检测MTCNN和人脸识别Facenet(附源码) 在说到人脸检测我们首先会想到利用Haar特征提取和Adaboost分类器进行人脸检测(有兴趣的可以去看一看这篇博客第九节、人脸检测之Haar分类器)，其检测效果也是不错的...
使用卷积神经网络（CNN）做人脸识别的示例代码
2020-09-17 08:07

模型构建时，我们可以选择使用预训练的模型，如VGGFace、FaceNet或OpenFace，这些模型已经在大规模人脸数据集上进行了预训练，可以直接用于人脸识别。如果没有预训练模型，我们需要从头开始训练，这可能需要大量的...
基于神经网络和OpenCV的人脸识别系统_python实现
2018-12-29 08:29

在这个“基于神经网络和OpenCV的人脸识别系统”中，你将找到完整的Python代码实现，这可能包括以下几个部分： 1. 数据预处理：可能包含图像的缩放、归一化以及灰度处理，以便于输入到神经网络。 2. 人脸检测：使用...
Python人脸识别签到.zip
2024-03-07 13:47

在本项目"Python人脸识别签到.zip"中，我们聚焦于使用Python编程语言实现人脸识别技术来构建一个签到系统。这个系统可能广泛应用于会议、学校、公司等场合，以自动化和安全的方式进行人员身份验证和签到流程。下面将...
基于Python的人脸识别系统的设计与实现.docx
2023-10-25 02:45

【基于Python的人脸识别系统的设计与实现】本文主要探讨了如何使用Python...综上所述，本论文详细阐述了基于Python的人脸识别系统的设计与实现，旨在为相关领域的研究者和开发者提供参考，推动人脸识别技术的发展。
深度学习五、MTCNN人脸检测与对齐和FaceNet人脸识别
2019-03-09 11:52

东城青年的博客 在说到人脸检测我们首先会想到利用Haar特征和Adaboost分类器进行人脸检测，其检测效果也是不错的，但是目前人脸检测的应用场景逐渐从室内演变到室外，从单一限定场景发展到广场、车站、地铁口等场景，人脸检测面临的...
第三十七节、人脸检测MTCNN和人脸识别Facenet(附源码)
2018-09-30 14:57

Graceful_scenery的博客 在说到人脸检测我们首先会想到利用Haar特征提取和Adaboost分类器进行人脸检测(有兴趣的可以去看一看这篇博客第九节、人脸检测之Haar分类器)，其检测效果也是不错的，但是目前人脸检测的应用场景逐渐从室内演变到室外，...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
已结题（查看结题原因） 3月21日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
已采纳回答 3月15日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 3月14日