pyqt5中如何通过OpenCV读取一帧图像喂入网络呢？

我想通过pyqt5制作一个UI界面封装google object detection api的示例代码，源代码中是识别单张图片，我想通过摄像头输入一帧的图像然后进行识别显示。整个程序如下：

 # coding:utf-8
'''
V3.0A版本，尝试实现摄像头识别
'''
import numpy as np
import cv2
import os
import os.path
import six.moves.urllib as urllib
import sys
import tarfile
import tensorflow as tf
import zipfile
import pylab
from distutils.version import StrictVersion
from collections import defaultdict
from io import StringIO
from matplotlib import pyplot as plt
from PIL import Image
from PyQt5 import QtCore, QtGui, QtWidgets
from PyQt5.QtWidgets import *
from PyQt5.QtCore import *
from PyQt5.QtGui import *

class UiForm():
    openfile_name_pb = ''
    openfile_name_pbtxt = ''
    openpic_name = ''
    num_class = 0

    def setupUi(self, Form):
        Form.setObjectName("Form")
        Form.resize(600, 690)
        Form.setMinimumSize(QtCore.QSize(600, 690))
        Form.setMaximumSize(QtCore.QSize(600, 690))
        self.frame = QtWidgets.QFrame(Form)
        self.frame.setGeometry(QtCore.QRect(20, 20, 550, 100))
        self.frame.setFrameShape(QtWidgets.QFrame.StyledPanel)
        self.frame.setFrameShadow(QtWidgets.QFrame.Raised)
        self.frame.setObjectName("frame")
        self.horizontalLayout_2 = QtWidgets.QHBoxLayout(self.frame)
        self.horizontalLayout_2.setObjectName("horizontalLayout_2")
        # 加载模型文件按钮
        self.btn_add_file = QtWidgets.QPushButton(self.frame)
        self.btn_add_file.setObjectName("btn_add_file")
        self.horizontalLayout_2.addWidget(self.btn_add_file)
        # 加载pbtxt文件按钮
        self.btn_add_pbtxt = QtWidgets.QPushButton(self.frame)
        self.btn_add_pbtxt.setObjectName("btn_add_pbtxt")
        self.horizontalLayout_2.addWidget(self.btn_add_pbtxt)
        # 输入检测类别数目按钮
        self.btn_enter = QtWidgets.QPushButton(self.frame)
        self.btn_enter.setObjectName("btn_enter")
        self.horizontalLayout_2.addWidget(self.btn_enter)
        # 打开摄像头
        self.btn_opencam = QtWidgets.QPushButton(self.frame)
        self.btn_opencam.setObjectName("btn_objdec")
        self.horizontalLayout_2.addWidget(self.btn_opencam)
        # 开始识别按钮
        self.btn_objdec = QtWidgets.QPushButton(self.frame)
        self.btn_objdec.setObjectName("btn_objdec")
        self.horizontalLayout_2.addWidget(self.btn_objdec)
        # 退出按钮
        self.btn_exit = QtWidgets.QPushButton(self.frame)
        self.btn_exit.setObjectName("btn_exit")
        self.horizontalLayout_2.addWidget(self.btn_exit)
        # 显示识别后的画面
        self.lab_rawimg_show = QtWidgets.QLabel(Form)
        self.lab_rawimg_show.setGeometry(QtCore.QRect(50, 140, 500, 500))
        self.lab_rawimg_show.setMinimumSize(QtCore.QSize(500, 500))
        self.lab_rawimg_show.setMaximumSize(QtCore.QSize(500, 500))
        self.lab_rawimg_show.setObjectName("lab_rawimg_show")
        self.lab_rawimg_show.setStyleSheet(("border:2px solid red"))


        self.retranslateUi(Form)
        # 这里将按钮和定义的动作相连，通过click信号连接openfile槽？
        self.btn_add_file.clicked.connect(self.openpb)
        # 用于打开pbtxt文件
        self.btn_add_pbtxt.clicked.connect(self.openpbtxt)
        # 用于用户输入类别数
        self.btn_enter.clicked.connect(self.enter_num_cls)
        # 打开摄像头
        self.btn_opencam.clicked.connect(self.opencam)
        # 开始识别
        # ~ self.btn_objdec.clicked.connect(self.object_detection)
        # 这里是将btn_exit按钮和Form窗口相连，点击按钮发送关闭窗口命令
        self.btn_exit.clicked.connect(Form.close)
        QtCore.QMetaObject.connectSlotsByName(Form)

    def retranslateUi(self, Form):
        _translate = QtCore.QCoreApplication.translate
        Form.setWindowTitle(_translate("Form", "目标检测"))
        self.btn_add_file.setText(_translate("Form", "加载模型文件"))
        self.btn_add_pbtxt.setText(_translate("Form", "加载pbtxt文件"))
        self.btn_enter.setText(_translate("From", "指定识别类别数"))
        self.btn_opencam.setText(_translate("Form", "打开摄像头"))
        self.btn_objdec.setText(_translate("From", "开始识别"))
        self.btn_exit.setText(_translate("Form", "退出"))
        self.lab_rawimg_show.setText(_translate("Form", "识别效果"))

    def openpb(self):
        global openfile_name_pb
        openfile_name_pb, _ = QFileDialog.getOpenFileName(self.btn_add_file,'选择pb文件','/home/kanghao/','pb_files(*.pb)')
        print('加载模型文件地址为：' + str(openfile_name_pb))

    def openpbtxt(self):
        global openfile_name_pbtxt
        openfile_name_pbtxt, _ = QFileDialog.getOpenFileName(self.btn_add_pbtxt,'选择pbtxt文件','/home/kanghao/','pbtxt_files(*.pbtxt)')
        print('加载标签文件地址为：' + str(openfile_name_pbtxt))

    def opencam(self):
        self.camcapture = cv2.VideoCapture(0)
        self.timer = QtCore.QTimer()
        self.timer.start()
        self.timer.setInterval(100) # 0.1s刷新一次
        self.timer.timeout.connect(self.camshow)

    def camshow(self):
        global camimg
        _ , camimg = self.camcapture.read()
        print(_)
        camimg = cv2.resize(camimg, (512, 512))
        camimg = cv2.cvtColor(camimg, cv2.COLOR_BGR2RGB)
        print(type(camimg))
        #strcamimg = camimg.tostring()
        showImage = QtGui.QImage(camimg.data, camimg.shape[1], camimg.shape[0], QtGui.QImage.Format_RGB888)
        self.lab_rawimg_show.setPixmap(QtGui.QPixmap.fromImage(showImage))

    def enter_num_cls(self):
        global num_class
        num_class, okPressed = QInputDialog.getInt(self.btn_enter,'指定训练类别数','你的目标有多少类？',1,1,28,1)
        if okPressed:
            print('识别目标总类为：' + str(num_class))

    def img2pixmap(self, image):
        Y, X = image.shape[:2]
        self._bgra = np.zeros((Y, X, 4), dtype=np.uint8, order='C')
        self._bgra[..., 0] = image[..., 2]
        self._bgra[..., 1] = image[..., 1]
        self._bgra[..., 2] = image[..., 0]
        qimage = QtGui.QImage(self._bgra.data, X, Y, QtGui.QImage.Format_RGB32)
        pixmap = QtGui.QPixmap.fromImage(qimage)
        return pixmap

    def object_detection(self):
        sys.path.append("..")
        from object_detection.utils import ops as utils_ops

        if StrictVersion(tf.__version__) < StrictVersion('1.9.0'):
            raise ImportError('Please upgrade your TensorFlow installation to v1.9.* or later!')

        from utils import label_map_util

        from utils import visualization_utils as vis_util

        # Path to frozen detection graph. This is the actual model that is used for the object detection.
        PATH_TO_FROZEN_GRAPH = openfile_name_pb

        # List of the strings that is used to add correct label for each box.
        PATH_TO_LABELS = openfile_name_pbtxt

        NUM_CLASSES = num_class

        detection_graph = tf.Graph()
        with detection_graph.as_default():
          od_graph_def = tf.GraphDef()
          with tf.gfile.GFile(PATH_TO_FROZEN_GRAPH, 'rb') as fid:
            serialized_graph = fid.read()
            od_graph_def.ParseFromString(serialized_graph)
            tf.import_graph_def(od_graph_def, name='')

        category_index = label_map_util.create_category_index_from_labelmap(PATH_TO_LABELS, use_display_name=True)

        def load_image_into_numpy_array(image):
          (im_width, im_height) = image.size
          return np.array(image.getdata()).reshape(
              (im_height, im_width, 3)).astype(np.uint8)

        # For the sake of simplicity we will use only 2 images:
        # image1.jpg
        # image2.jpg
        # If you want to test the code with your images, just add path to the images to the TEST_IMAGE_PATHS.
        TEST_IMAGE_PATHS = camimg
        print(TEST_IMAGE_PATHS)
        # Size, in inches, of the output images.
        IMAGE_SIZE = (12, 8)

        def run_inference_for_single_image(image, graph):
          with graph.as_default():
            with tf.Session() as sess:
              # Get handles to input and output tensors
              ops = tf.get_default_graph().get_operations()
              all_tensor_names = {output.name for op in ops for output in op.outputs}
              tensor_dict = {}
              for key in [
                  'num_detections', 'detection_boxes', 'detection_scores',
                  'detection_classes', 'detection_masks'
              ]:
                tensor_name = key + ':0'
                if tensor_name in all_tensor_names:
                  tensor_dict[key] = tf.get_default_graph().get_tensor_by_name(
                      tensor_name)
              if 'detection_masks' in tensor_dict:
                # The following processing is only for single image
                detection_boxes = tf.squeeze(tensor_dict['detection_boxes'], [0])
                detection_masks = tf.squeeze(tensor_dict['detection_masks'], [0])
                # Reframe is required to translate mask from box coordinates to image coordinates and fit the image size.
                real_num_detection = tf.cast(tensor_dict['num_detections'][0], tf.int32)
                detection_boxes = tf.slice(detection_boxes, [0, 0], [real_num_detection, -1])
                detection_masks = tf.slice(detection_masks, [0, 0, 0], [real_num_detection, -1, -1])
                detection_masks_reframed = utils_ops.reframe_box_masks_to_image_masks(
                    detection_masks, detection_boxes, image.shape[0], image.shape[1])
                detection_masks_reframed = tf.cast(
                    tf.greater(detection_masks_reframed, 0.5), tf.uint8)
                # Follow the convention by adding back the batch dimension
                tensor_dict['detection_masks'] = tf.expand_dims(
                    detection_masks_reframed, 0)
              image_tensor = tf.get_default_graph().get_tensor_by_name('image_tensor:0')

              # Run inference
              output_dict = sess.run(tensor_dict,
                                     feed_dict={image_tensor: np.expand_dims(image, 0)})

              # all outputs are float32 numpy arrays, so convert types as appropriate
              output_dict['num_detections'] = int(output_dict['num_detections'][0])
              output_dict['detection_classes'] = output_dict[
                  'detection_classes'][0].astype(np.uint8)
              output_dict['detection_boxes'] = output_dict['detection_boxes'][0]
              output_dict['detection_scores'] = output_dict['detection_scores'][0]
              if 'detection_masks' in output_dict:
                output_dict['detection_masks'] = output_dict['detection_masks'][0]
          return output_dict


        #image = Image.open(TEST_IMAGE_PATHS)
        # the array based representation of the image will be used later in order to prepare the
        # result image with boxes and labels on it.
        image_np = load_image_into_numpy_array(TEST_IMAGE_PATHS)
        # Expand dimensions since the model expects images to have shape: [1, None, None, 3]
        image_np_expanded = np.expand_dims(image_np, axis=0)
        # Actual detection.
        output_dict = run_inference_for_single_image(image_np, detection_graph)
        # Visualization of the results of a detection.
        vis_util.visualize_boxes_and_labels_on_image_array(
            image_np,
            output_dict['detection_boxes'],
            output_dict['detection_classes'],
            output_dict['detection_scores'],
            category_index,
            instance_masks=output_dict.get('detection_masks'),
            use_normalized_coordinates=True,
            line_thickness=8)
        plt.figure(figsize=IMAGE_SIZE)
        plt.imshow(image_np)
        #plt.savefig(str(TEST_IMAGE_PATHS)+".jpg")

## 用于显示ui界面的命令
if __name__ == "__main__":
    app = QtWidgets.QApplication(sys.argv)
    Window = QtWidgets.QWidget()
    # ui为根据类Ui_From()创建的实例
    ui = UiForm()
    ui.setupUi(Window)
    Window.show()
    sys.exit(app.exec_())

但是运行提示：

求助

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

1条回答

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
Masec 2018-11-30 10:17
关注
问题已解决……
完全不需要load_image_into_numpy_array这个函数了啊……我现在输入的本来就是numpy.array的图片了……

本回答被题主选为最佳回答 , 对您是否有帮助呢?

解决无用
评论打赏
分享
举报

评论

按下Enter换行，Ctrl+Enter发表内容

报告相同问题？

关注问题

pyqt5中如何通过OpenCV读取一帧图像喂入网络呢？ opencv
2018-11-30 08:37

回答 1 已采纳问题已解决…… 完全不需要load_image_into_numpy_array这个函数了啊……我现在输入的本来就是numpy.array的图片了……
pyqt5中的QLabel如何实现点击按钮后更新里面的文本呢？ python qt 有问必答
2022-03-13 02:47

回答 2 已采纳按下对应按钮直接设置不行吗？label.setText("02")
PyQt5中如何在lable中加载的图片上绘制矩形框呢？ python
2018-12-12 08:02

回答 1 已采纳 emmmm……解决了……手动笑哭脸。定义了一个QLable类，在这个类中定义鼠标事件。然后将self.show（show这个名字起的很不好……改成了showimg）这个lable改为我们定义的l
【人机交互】pyqt5+opencv对人脸进行识别
2022-04-18 17:02

只搬烫手的砖的博客解决问题：通过pyqt5对opencv人脸识别模块进行调用文章目录1. pyqt5界面的设计 1. pyqt5界面的设计
python实现PyQt5中QFontComboBox所选字体的路径和文件名读取 pycharm python qt 有问必答
2022-02-27 13:55

回答 3 已采纳使用信号/槽机制：（1）QFontComboBox 中的选项选中动作作为触发信号，连接对应的字体选择槽函数；（2）例如选择“黑体”动作，连接槽函数 heitiSetup() 槽函数，函数 heitiS
pyqt5中如何将类class中的方法中的参数调用至另一个函数 python qt 有问必答
2021-11-14 22:34

回答 3 已采纳把pathhm变成类属性，赋予初始值，然后在b中实例化，再调用属性就可以了
做后台管理系统还是用PYQT5做个小软件用呢？ django python vue.js
2022-11-12 21:01

回答 4 已采纳一、前置总结了一下你目前的几个问题（已知条件）：个人原因可以说是小白，技术上并不满足实现需求的标准自己了解一些 python，并且使用了 pandas 以及 xlwt 这些目前（改革）通过手动录入
基于opencv和PyQt5的人脸识别
2023-08-21 14:42

宝宝巴逝的博客结合opencv和PyQt5做视频(摄像头)的人脸识别
如何用pyqt5的Qprogressbar控件做一个显示脚本运行进度的进度条？ python qt 有问必答
2022-04-19 22:06

回答 2 已采纳 import os import sys from PyQt5.QtCore import QBasicTimer from PyQt5.QtWidgets import QApplication
如何去除PyQt5中textEdit与窗体之间的空隙？ python
2022-05-10 15:06

回答 2 已采纳题主是用QBoxLayout布局吧？Qt这一点很不人性，QVBoxLayout里面上下左右各有11像素的留白，要想去掉，试试我这个方法。参考代码如下。 import sys from PyQt6.Qt
选择pyqt5+mysql还是django+vue呢？ django python vue.js
2022-11-09 12:07

回答 5 已采纳改成这个django+vue+mysql，是不有答案了呢？后者成本会高，纯粹为了开发这个功能可以前者，毕竟技术栈少点，如果为了提升自己挑战下可以后者
基于pyqt5与opencv读取播放本地视频
2023-10-25 09:20

人工智能教学实践的博客对象，并将其设置为窗口的中央部件。设置窗口的初始大小为800x600像素，并设置窗口标题为"视频播放"。最后，启动应用程序的事件循环，并确保程序正常退出。...为True），将帧从BGR...，并开始定时器以读取和显示视频帧。
pyqt5做界面，如何通过按钮获取指定的txt文件中的文本内容，然后显示到文本框中？ python
2020-05-13 17:44

回答 2 已采纳思路如下：1）打开文件并读取其内容；2）设置翻译按钮的动作指令，即将文本内容添加至文本框中。 ``` fileAddress = "D:/咕咕鸡系列/咕咕鸡.txt"
PyQt5 | PyQt5打开图片、视频、摄像头
2022-11-06 14:16

迪菲赫尔曼的博客 PyQt5实现打开图片，打开视频，打开摄像头教程
消除Python OpenCV显示摄像头画面的延迟
2023-02-02 21:12

__弯弓__的博客用 Python 通过 OpenCV显示摄像头画面时，可能出现画面延迟，显示的...解决方案，自定义1上读取视频帧的类取代opencv的VideoCapture，通过后台工作线程实时读帧，放入队列，同时删除旧帧，oepncv显示时从新类中取帧。
没有解决我的问题, 去提问

悬赏问题

¥15 如何处理复杂数据表格的除法运算
¥15 如何用stc8h1k08的片子做485数据透传的功能？(关键词-串口)
¥15 有兄弟姐妹会用word插图功能制作类似citespace的图片吗？
¥200 uniapp长期运行卡死问题解决
¥15 请教：如何用postman调用本地虚拟机区块链接上的合约？
¥15 为什么使用javacv转封装rtsp为rtmp时出现如下问题：[h264 @ 000000004faf7500]no frame？
¥15 乘性高斯噪声在深度学习网络中的应用
¥15 关于docker部署flink集成hadoop的yarn，请教个问题 flink启动yarn-session.sh连不上hadoop，这个整了好几天一直不行，求帮忙看一下怎么解决
¥15 深度学习根据CNN网络模型，搭建BP模型并训练MNIST数据集
¥15 C++ 头文件/宏冲突问题解决