mtcnn和facenet实现部分遮挡下的人脸识别

问题遇到的现象和发生背景

问题相关代码，请勿粘贴截图

运行结果及报错内容

我的解答思路和尝试过的方法

我想要达到的结果

对于这些代码我还不太清楚，希望可以帮我用中文详细注释一下代码，谢谢。
``

from facenet import MTCNN, InceptionResnetV1
from torchvision.transforms import functional as F
import numpy as np
import matplotlib.pyplot as plt
import cv2
from PIL import Image
from scipy.spatial.distance import canberra
from sklearn.preprocessing import Normalizer
import torch
import tkinter as tk
from tkinter.filedialog import askopenfilename
from PIL import Image, ImageTk

# Maximum (width, height), in pixels, of the box that Resize() scales an image to fit within.
max_w_h = (700, 500)

def ShowImg(img, img_labels):
    """Show an OpenCV image on a Tk label.

    Args:
        img: Image array in BGR channel order; it is converted with
            ``cv2.COLOR_BGR2RGBA`` before being handed to PIL.
        img_labels: Widget whose ``image`` option is set to the converted
            picture.
    """
    photo = ImageTk.PhotoImage(
        Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGBA))
    )
    img_labels.config(image=photo)
    # Also store the PhotoImage on the widget so a Python reference to it
    # outlives this call.
    img_labels.image = photo

def Resize(img):
    """Scale an image to fit inside ``max_w_h`` while keeping its aspect ratio.

    Args:
        img: Image array whose first two dimensions are (height, width).
            A trailing channel dimension is optional.

    Returns:
        The array returned by ``cv2.resize`` for the computed target size.
    """
    # Only height and width are needed, so 2-D (single-channel) arrays are
    # accepted as well as H x W x C ones.
    h, w = img.shape[:2]
    max_w, max_h = max_w_h
    ratio = h / w
    if max_w * ratio > max_h:
        # At full width the image would be too tall: height is the limit.
        new_w, new_h = int(max_h / ratio), int(max_h)
    else:
        new_w, new_h = int(max_w), int(max_w * ratio)
    # int() truncation can yield 0 for extreme aspect ratios, and cv2.resize
    # does not accept an empty target size.
    return cv2.resize(img, (max(new_w, 1), max(new_h, 1)))

# Set to True to use the first CUDA device when one is available.
gpu = False
# Logical `and` (not bitwise `&`) so CUDA is only probed when it was requested.
device = torch.device('cuda:0' if gpu and torch.cuda.is_available() else 'cpu')
print('Running on device: {}'.format(device))

# Load the FaceNet model (weights selected by pretrained='vggface2') in eval mode.
facerec = InceptionResnetV1(pretrained='vggface2').eval().to(device)

# Load the MTCNN model used by run() to locate and crop the face.
mtcnn = MTCNN(margin=30, device=device)
# NOTE(review): l2_encoder is not referenced by the code visible in this file.
l2_encoder = Normalizer(norm='l2')

# Load the stored faces: run() uses array 'a' as the known embeddings and
# array 'b' as their labels. The context manager closes the .npz file once
# both arrays have been read.
with np.load('data.npz') as data:
    trainx_embed, trainy = data['a'], data['b']

def calculate_distance(embedding, known_faces, known_labels):
    """Return the closest known label for a face embedding.

    Each known embedding is compared with ``embedding`` using the Canberra
    distance. The distances are averaged per label and the label with the
    smallest average is selected (the first such label wins on a tie).

    Args:
        embedding: Query embedding. It is flattened first, so both ``(d,)``
            and a single-item batch ``(1, d)`` are accepted.
        known_faces: Sequence of known embeddings, one per entry.
        known_labels: Labels matched to ``known_faces`` by position; entries
            without a counterpart in the other sequence are ignored.

    Returns:
        Tuple ``(distance, label)`` holding the smallest per-label average
        distance and the label it belongs to.

    Raises:
        ValueError: If there is no known face to compare against.
    """
    # canberra() works on 1-D vectors; flattening drops a leading batch
    # dimension instead of letting the call fail on 2-D input.
    query = np.ravel(embedding)

    per_label = {}
    for label, face in zip(known_labels, known_faces):
        per_label.setdefault(label, []).append(canberra(query, np.ravel(face)))
    if not per_label:
        raise ValueError('no known faces to compare against')

    averages = {
        label: sum(distances) / len(distances)
        for label, distances in per_label.items()
    }
    best = min(averages, key=averages.get)
    return (averages[best], best)

def run(imgp):
    """Recognise the face in an image file and display the annotated image.

    The face is cropped with ``mtcnn``, embedded with ``facerec`` and matched
    against ``trainx_embed`` / ``trainy`` via ``calculate_distance``. The
    bounding box and the label (or "UNKNOWN" when the distance exceeds 350)
    are drawn on the image, which is then shown on the ``img_l`` label.

    Failures are reported on stdout rather than raised, so the GUI keeps
    running.

    Args:
        imgp: Path of the image file to process.
    """
    try:
        # The context manager closes the file once the face crop has been
        # copied into an array.
        with Image.open(imgp) as img:
            _, img_cropped, box = mtcnn(img)
            # NOTE(review): assumes the detector reports "no face" through
            # None values - confirm against the local facenet module.
            if img_cropped is None or box is None:
                print('Can not detect face!')
                return
            face_array = np.array(img_cropped)
        face_pixels = F.to_tensor(np.float32(face_array))
        face_pixels = (face_pixels - 127.5) / 128.0
        # Inference only, so no autograd graph needs to be recorded.
        with torch.no_grad():
            feas = facerec(face_pixels.unsqueeze(0).to(device))
        # Drop the batch dimension so a 1-D vector reaches the distance code.
        feas = feas.cpu().detach().numpy()[0]
        distance, label = calculate_distance(feas, trainx_embed, trainy)
        print(label)
        # plot
        image = cv2.imread(imgp)
        if image is None:
            # cv2.imread returns None instead of raising when it cannot read
            # the file.
            print('Can not read image: {}'.format(imgp))
            return
        if distance > 350:  # 368
            label = "UNKNOWN"
        # cv2 text functions need a plain string, whatever type the stored
        # labels have.
        label = str(label)
        p1, p2 = (int(box[0]), int(box[1])), (int(box[2]), int(box[3]))
        # Line thickness grows with the image dimensions, never below 2.
        thickness = max(round(sum(image.shape) / 2 * 0.003), 2)
        cv2.rectangle(image, p1, p2, (0, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
        tf = max(thickness - 1, 1)  # font thickness
        w, h = cv2.getTextSize(label, 0, fontScale=thickness / 3, thickness=tf)[0]  # text width, height
        outside = p1[1] - h - 3 >= 0  # label fits outside box
        cv2.putText(image, label, (p1[0], p1[1] - 2 if outside else p1[1] + h + 2), 0, thickness / 3, (0, 255, 255),
                    thickness=tf, lineType=cv2.LINE_AA)
        data_img = Resize(image)
        ShowImg(data_img, img_l)
        img_l.update()
    except Exception as exc:
        # Keep the original message, but also show the cause so that
        # unrelated errors are not mistaken for a detection failure.
        print('Can not detect face!')
        print('Reason: {!r}'.format(exc))

def select_img():
    """Ask the user for an image file and run recognition on it."""
    path = askopenfilename()
    # The dialog yields an empty value when it is cancelled; there is nothing
    # to process in that case.
    if not path:
        return
    try:
        run(path)
    except Exception as exc:
        # Report the problem instead of discarding it silently, while still
        # keeping the GUI alive.
        print('Failed to process {}: {!r}'.format(path, exc))

if __name__ == '__main__':
    # Build the main window and centre it on the screen.
    root = tk.Tk()
    root.title("Face Detection Demo")
    sc_width = root.winfo_screenwidth()
    sc_height = root.winfo_screenheight()
    WID = 600  # window width
    HEI = 600  # window height
    # Horizontally centred; vertically placed 30 px above the centre.
    root.geometry('%dx%d+%d+%d' % (WID, HEI, (sc_width - WID) / 2, (sc_height - HEI) / 2 - 30))
    # Named font_spec rather than `type` so the builtin is not shadowed.
    font_spec = ('宋体', "12", 'normal')

    # Top row: a button to load an image and a button to quit.
    up_frame = tk.Frame(root)
    tk.Button(up_frame, text='加载图片', command=select_img, font=font_spec).pack(padx=1, side=tk.LEFT)
    tk.Button(up_frame, text='退出系统', command=root.destroy, font=font_spec).pack(padx=1, side=tk.LEFT)
    up_frame.pack(pady=1, anchor='n')

    # Label that displays the result; run() reads img_l as a global.
    img_frame = tk.Frame(root)
    img_l = tk.Label(img_frame)
    img_l.pack()
    img_frame.pack(pady=20)
    root.mainloop()

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

2条回答默认最新

CSDN专家-深度学习进阶 2022-03-15 09:05

关注

我已在对应代码行的后面用 # 写了注释，代码如下：

from facenet import MTCNN, InceptionResnetV1             #导入各种需要用到的包
from torchvision.transforms import functional as F
import numpy as np
import matplotlib.pyplot as plt
import cv2
from PIL import Image
from scipy.spatial.distance import canberra
from sklearn.preprocessing import Normalizer
import torch
import tkinter as tk
from tkinter.filedialog import askopenfilename
from PIL import Image, ImageTk
 
# Maximum (width, height), in pixels, of the box that Resize() scales an image to fit within.
max_w_h = (700, 500)
 
def ShowImg(img, img_labels):
    """Show an OpenCV image on a Tk label.

    Args:
        img: Image array in BGR channel order; it is converted with
            ``cv2.COLOR_BGR2RGBA`` before being handed to PIL.
        img_labels: Widget whose ``image`` option is set to the converted
            picture.
    """
    photo = ImageTk.PhotoImage(
        Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGBA))
    )
    img_labels.config(image=photo)
    # Also store the PhotoImage on the widget so a Python reference to it
    # outlives this call.
    img_labels.image = photo
 
def Resize(img):
    """Scale an image to fit inside ``max_w_h`` while keeping its aspect ratio.

    Args:
        img: Image array whose first two dimensions are (height, width).
            A trailing channel dimension is optional.

    Returns:
        The array returned by ``cv2.resize`` for the computed target size.
    """
    # Only height and width are needed, so 2-D (single-channel) arrays are
    # accepted as well as H x W x C ones.
    h, w = img.shape[:2]
    max_w, max_h = max_w_h
    ratio = h / w
    if max_w * ratio > max_h:
        # At full width the image would be too tall: height is the limit.
        new_w, new_h = int(max_h / ratio), int(max_h)
    else:
        new_w, new_h = int(max_w), int(max_w * ratio)
    # int() truncation can yield 0 for extreme aspect ratios, and cv2.resize
    # does not accept an empty target size.
    return cv2.resize(img, (max(new_w, 1), max(new_h, 1)))
 
# Set to True to use the first CUDA device when one is available.
gpu = False
# Logical `and` (not bitwise `&`) so CUDA is only probed when it was requested.
device = torch.device('cuda:0' if gpu and torch.cuda.is_available() else 'cpu')
print('Running on device: {}'.format(device))

# Load the FaceNet model (weights selected by pretrained='vggface2') in eval mode.
facerec = InceptionResnetV1(pretrained='vggface2').eval().to(device)

# Load the MTCNN model used by run() to locate and crop the face.
mtcnn = MTCNN(margin=30, device=device)
# NOTE(review): l2_encoder is not referenced by the code visible in this file.
l2_encoder = Normalizer(norm='l2')

# Load the stored faces: run() uses array 'a' as the known embeddings and
# array 'b' as their labels. The context manager closes the .npz file once
# both arrays have been read.
with np.load('data.npz') as data:
    trainx_embed, trainy = data['a'], data['b']
 
def calculate_distance(embedding, known_faces, known_labels):
    """Return the closest known label for a face embedding.

    Each known embedding is compared with ``embedding`` using the Canberra
    distance. The distances are averaged per label and the label with the
    smallest average is selected (the first such label wins on a tie).

    Args:
        embedding: Query embedding. It is flattened first, so both ``(d,)``
            and a single-item batch ``(1, d)`` are accepted.
        known_faces: Sequence of known embeddings, one per entry.
        known_labels: Labels matched to ``known_faces`` by position; entries
            without a counterpart in the other sequence are ignored.

    Returns:
        Tuple ``(distance, label)`` holding the smallest per-label average
        distance and the label it belongs to.

    Raises:
        ValueError: If there is no known face to compare against.
    """
    # canberra() works on 1-D vectors; flattening drops a leading batch
    # dimension instead of letting the call fail on 2-D input.
    query = np.ravel(embedding)

    per_label = {}
    for label, face in zip(known_labels, known_faces):
        per_label.setdefault(label, []).append(canberra(query, np.ravel(face)))
    if not per_label:
        raise ValueError('no known faces to compare against')

    averages = {
        label: sum(distances) / len(distances)
        for label, distances in per_label.items()
    }
    best = min(averages, key=averages.get)
    return (averages[best], best)
 
def run(imgp):
    """Recognise the face in an image file and display the annotated image.

    The face is cropped with ``mtcnn``, embedded with ``facerec`` and matched
    against ``trainx_embed`` / ``trainy`` via ``calculate_distance``. The
    bounding box and the label (or "UNKNOWN" when the distance exceeds 350)
    are drawn on the image, which is then shown on the ``img_l`` label.

    Failures are reported on stdout rather than raised, so the GUI keeps
    running.

    Args:
        imgp: Path of the image file to process.
    """
    try:
        # The context manager closes the file once the face crop has been
        # copied into an array.
        with Image.open(imgp) as img:
            _, img_cropped, box = mtcnn(img)
            # NOTE(review): assumes the detector reports "no face" through
            # None values - confirm against the local facenet module.
            if img_cropped is None or box is None:
                print('Can not detect face!')
                return
            face_array = np.array(img_cropped)
        face_pixels = F.to_tensor(np.float32(face_array))
        face_pixels = (face_pixels - 127.5) / 128.0
        # Inference only, so no autograd graph needs to be recorded.
        with torch.no_grad():
            feas = facerec(face_pixels.unsqueeze(0).to(device))
        # Drop the batch dimension so a 1-D vector reaches the distance code.
        feas = feas.cpu().detach().numpy()[0]
        distance, label = calculate_distance(feas, trainx_embed, trainy)
        print(label)
        # plot
        image = cv2.imread(imgp)
        if image is None:
            # cv2.imread returns None instead of raising when it cannot read
            # the file.
            print('Can not read image: {}'.format(imgp))
            return
        if distance > 350:  # 368
            label = "UNKNOWN"
        # cv2 text functions need a plain string, whatever type the stored
        # labels have.
        label = str(label)
        p1, p2 = (int(box[0]), int(box[1])), (int(box[2]), int(box[3]))
        # Line thickness grows with the image dimensions, never below 2.
        thickness = max(round(sum(image.shape) / 2 * 0.003), 2)
        cv2.rectangle(image, p1, p2, (0, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
        tf = max(thickness - 1, 1)  # font thickness
        w, h = cv2.getTextSize(label, 0, fontScale=thickness / 3, thickness=tf)[0]  # text width, height
        outside = p1[1] - h - 3 >= 0  # label fits outside box
        cv2.putText(image, label, (p1[0], p1[1] - 2 if outside else p1[1] + h + 2), 0, thickness / 3, (0, 255, 255),
                    thickness=tf, lineType=cv2.LINE_AA)
        data_img = Resize(image)
        ShowImg(data_img, img_l)
        img_l.update()
    except Exception as exc:
        # Keep the original message, but also show the cause so that
        # unrelated errors are not mistaken for a detection failure.
        print('Can not detect face!')
        print('Reason: {!r}'.format(exc))
 
def select_img():
    """Ask the user for an image file and run recognition on it."""
    path = askopenfilename()
    # The dialog yields an empty value when it is cancelled; there is nothing
    # to process in that case.
    if not path:
        return
    try:
        run(path)
    except Exception as exc:
        # Report the problem instead of discarding it silently, while still
        # keeping the GUI alive.
        print('Failed to process {}: {!r}'.format(path, exc))
 
if __name__ == '__main__':  # program entry point
    # Build the main window and centre it on the screen.
    root = tk.Tk()  # create the Tk root window
    root.title("Face Detection Demo")  # window title
    sc_width = root.winfo_screenwidth()  # screen width
    sc_height = root.winfo_screenheight()  # screen height
    WID = 600  # window width
    HEI = 600  # window height
    # Horizontally centred; vertically placed 30 px above the centre.
    root.geometry('%dx%d+%d+%d' % (WID, HEI, (sc_width - WID) / 2, (sc_height - HEI) / 2 - 30))
    # Font for the buttons; named font_spec rather than `type` so the builtin
    # is not shadowed.
    font_spec = ('宋体', "12", 'normal')

    # Top row: a button to load an image and a button to quit.
    up_frame = tk.Frame(root)
    tk.Button(up_frame, text='加载图片', command=select_img, font=font_spec).pack(padx=1, side=tk.LEFT)
    tk.Button(up_frame, text='退出系统', command=root.destroy, font=font_spec).pack(padx=1, side=tk.LEFT)
    up_frame.pack(pady=1, anchor='n')

    # Label that displays the result; run() reads img_l as a global.
    img_frame = tk.Frame(root)
    img_l = tk.Label(img_frame)
    img_l.pack()
    img_frame.pack(pady=20)
    root.mainloop()

本回答被题主选为最佳回答 , 对您是否有帮助呢?

查看更多回答(1条)

报告相同问题？

关注问题

mtcnn和facenet实现部分遮挡下的人脸识别 python 有问必答深度学习
2022-03-14 16:42

回答 2 已采纳对应代码块后面#写了注释 from facenet import MTCNN, InceptionResnetV1 #导入各种需要用到的包 from torchvision.t
css实现高斯模糊，毛玻璃遮挡效果 css
2021-08-17 15:54

回答 1 已采纳 filter: blur(20px); 属性
Qt菜单栏被dock和中心工作区遮挡 c++ qt
2022-09-26 21:16

回答 1 已采纳你的主窗口是派生于QMainWindow吗？QMainWindow内部会自动管理menuBar, statusBar, docker widgets,和centeral widget，不会出现遮挡情况
基于MTCNN和FaceNet的实时人脸检测识别系统
2022-08-07 14:06

HarmoniaLeo的博客 MTCNN是强大的人脸特征提取器，我们采用MTCNN提取图像的特征，并利用FaceNet将图像特征映射到128维特征空间，随后在特征空间中比较人脸的相似性，进行人脸检测与识别。
mui框架自带的底部导航栏遮挡住了部分样式求解～ css3 html5
2022-01-01 16:35

回答 2 已采纳把内容容器设置padding-bottom: 底部高度
同时使用weifenluo 和 ToolStip 控件会遮挡 c# visual studio
2020-09-13 21:56

回答 2 已采纳 weifenluo 是什么东西？toolstrip 么？注意下添加的顺序，先把 tpplstrip放上去，点窗口客户区，再添加 panel 设置panel 的 dockstyle 为 fill
如何识别被覆盖的文字 python 问答团队
2023-03-22 15:46

回答 2 已采纳识别印章下被遮挡的文字需要结合计算机视觉和OCR（Optical Character Recognition）技术。以下是一些可以学习的方向：图像处理和计算机视觉：图像处理和计算机视觉是必不可少的基
利用MTCNN和facenet实现人脸检测和人脸识别
2019-05-14 11:16

老三是只猫的博客利用MTCNN和facenet实现人脸检测和人脸识别 人脸检测和人脸识别技术算是目前人工智能方面应用最成熟的技术了。本博客将利用mtcnn和faceNet搭建一个实现人脸检测和人脸识别的系统。基本思路也很简单，...
基于c++与opencv实现图像识别定位？ c++
2020-02-28 11:01

回答 3 已采纳 1. 霍夫直线识别出四个直线(先预处理图片) 2. 取同一直线上的较远的两个点(霍夫直线出来后相当于4个点阵每个点阵就是一条直线),算出直线方程, 4条操作相同 3. 算出两个十字标的交点(第二
python绘制前后2个长方体，前面的长方体显示不了？ python 有问必答
2021-05-06 17:17

回答 5 已采纳是代码设置位置不同？还是参数设置问题
pyecharts画图，有的时候标签和数据显示重叠了怎么办 python
2021-03-03 22:30

回答 4 已采纳 from pyecharts import options as opts from pyecharts.charts import Gauge c = ( Gauge() .ad
基于mtcnn+facenet+svm实现人脸识别系统GUI界面附完整代码数据集
2023-02-04 16:20

计算机毕设论文的博客基于mtcnn+facenet+svm实现人脸识别系统GUI界面附完整代码数据集
python pyecharts page怎么设置各张图的间隔 html5 python
2018-11-17 07:14

回答 1 已采纳调整xaxis_rotate角度已解决
(超详细)基于MTCNN+FaceNet实现人脸识别及轻量级网络探索和改进(附数据集及预训练模型)
2020-07-05 11:00

zhulu_20的博客首先会进行FaceNet原理介绍一、原理分析你好！这是你第一次使用 Markdown编辑器所展示的欢迎页。如果你想学习如何使用Markdown编辑器, 可以仔细阅读这篇文章，了解一下Markdown的基本语法知识。新的改变我们对...
基于facenet_pytorch实现人脸识别
2022-09-09 20:52

MrJson-架构师的博客介绍 facenet-pytorch库里面包含了两个重要功能：人脸检测和人脸识别，其中人脸检测部分使用mtcnn算法，人脸识别部分使用Facenet算法。利用这个库，可以轻松实现人脸检测和人脸向量映射操作。依赖安装 pip install ...
深度学习五、MTCNN人脸检测与对齐和FaceNet人脸识别
2019-03-09 19:52

东城青年的博客在说到人脸检测我们首先会想到利用Harr特征和Adaboost分类器进行人脸检测，其检测效果也是不错的，但是目前人脸检测的应用场景逐渐从室内演变到室外，从单一限定场景发展到广场、车站、地铁口等场景，人脸检测面临的...
人脸检测MTCNN和人脸识别Facenet(附源码)
2018-12-05 10:51

tuuzhang的博客原文链接：人脸检测MTCNN和人脸识别Facenet(附源码) 在说到人脸检测我们首先会想到利用Harr特征提取和Adaboost分类器进行人脸检测(有兴趣的可以去一看这篇博客第九节、人脸检测之Haar分类器)，其检测效果也是不错的...
原理讲解-项目实战＜-＞Mtcnn+Mobilent实现人脸口罩检测
2022-06-10 15:05

码农的后花园的博客这里主要针对Mobilent网络进行训练，首先设置训练模型保存权重的位置，...总结Mtcnn分为四步，分别是图像金字塔先把输入图片进行缩放，缩放完成之后，我们可以提取出大的人脸和小的人脸，使得网络提取的效果更有效。..
深度学习人脸检测与人脸识别
2021-12-13 01:01

白拾Official的博客 人脸识别是对人脸图像身份进行确认，人脸识别通常会先对人脸进行检测定位，再进行识别；人脸检索是根据输入的人脸图像，从图像库或视频库中检索包含该人脸的其它图像或视频。 2. 人脸检测与识别的应用实名认证 ...
（转）第三十七节、人脸检测MTCNN和人脸识别Facenet(附源码)
2019-03-03 16:16

zyb418的博客在说到人脸检测我们首先会想到利用Harr特征提取和Adaboost分类器进行人脸检测(有兴趣的可以去一看这篇博客第九节、人脸检测之Haar分类器)，其检测效果也是不错的，但是目前人脸检测的应用场景逐渐从室内演变到室外，...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
已结题（查看结题原因） 3月21日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
已采纳回答 3月15日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 3月14日

悬赏问题

¥15 对于这个复杂问题的解释说明
¥50 三种调度算法报错有实例
¥15 关于#python#的问题，请各位专家解答！
¥200 询问：python实现大地主题正反算的程序设计，有偿
¥15 smptlib使用465端口发送邮件失败
¥200 总是报错，能帮助用python实现程序实现高斯正反算吗？有偿
¥15 对于squad数据集的基于bert模型的微调
¥15 为什么我运行这个网络会出现以下报错？CRNN神经网络
¥20 steam下载游戏占用内存
¥15 CST保存项目时失败

mtcnn和facenet实现部分遮挡下的人脸识别

问题遇到的现象和发生背景

问题相关代码，请勿粘贴截图

运行结果及报错内容

我的解答思路和尝试过的方法

我想要达到的结果

2条回答 默认 最新

问题事件

悬赏问题

2条回答默认最新