【學習筆記】pyQt5學習筆記（4）——第一個影象識別demo V3.0B

阿新 • • 發佈：2019-01-02

軟體更新日誌V3.0B版本，在2.0基礎上實現了呼叫攝像頭的實時識別功能。V3.0A版若不實時重新整理識別畫面，可以手動點一次識別一次……

附上完整程式碼，也是做個程式碼備份。需要的小夥伴自取就ok～

軟體目前存在的bug：1. 開始識別後會很卡，目前認為可能的原因是每次重新整理都重複載入了模型檔案；2. 攝像頭畫面與實時識別畫面的比例不一樣，後期再優化。

# coding:utf-8
'''
V3.0B版本，實現攝像頭識別,實時重新整理顯示結果
@author:kangshifu
'''
import numpy as np
import cv2
import os
import os.path
import six.moves.urllib as urllib
import sys
import tarfile
import tensorflow as tf
import zipfile
import pylab
from distutils.version import StrictVersion
from collections import defaultdict
from io import StringIO
from matplotlib import pyplot as plt
from PIL import Image
from PyQt5 import QtCore, QtGui, QtWidgets
from PyQt5.QtWidgets import *
from PyQt5.QtCore import *
from PyQt5.QtGui import *

class UiForm():
    """Window of the object-detection demo (V3.0B).

    The form offers buttons to pick a frozen TensorFlow graph (``.pb``) and a
    label map (``.pbtxt``), to enter the number of classes, to open the
    default camera and to start periodic detection.  The raw camera frame is
    shown in the left label and the annotated frame in the right label.

    State shared between the slots lives in the module-level globals
    ``openfile_name_pb``, ``openfile_name_pbtxt``, ``num_class`` and
    ``camimg``; they are only created once the corresponding action has
    succeeded.
    """

    # Period of the camera preview timer, in milliseconds.
    CAM_INTERVAL_MS = 3
    # Period of the detection timer, in milliseconds.  QTimer.setInterval()
    # takes an integer number of milliseconds; the previous value 0.3 was not
    # a valid argument.
    DETECT_INTERVAL_MS = 300

    def setupUi(self, Form):
        """Create all widgets on ``Form`` and wire the buttons to their slots.

        Args:
            Form: the QWidget that hosts the user interface.
        """
        Form.setObjectName("Form")
        Form.resize(600, 420)
        Form.setMinimumSize(QtCore.QSize(600, 420))
        Form.setMaximumSize(QtCore.QSize(600, 420))
        self.frame = QtWidgets.QFrame(Form)
        self.frame.setGeometry(QtCore.QRect(20, 20, 550, 100))
        self.frame.setFrameShape(QtWidgets.QFrame.StyledPanel)
        self.frame.setFrameShadow(QtWidgets.QFrame.Raised)
        self.frame.setObjectName("frame")
        self.horizontalLayout_2 = QtWidgets.QHBoxLayout(self.frame)
        self.horizontalLayout_2.setObjectName("horizontalLayout_2")
        # "Load model file" button
        self.btn_add_file = QtWidgets.QPushButton(self.frame)
        self.btn_add_file.setObjectName("btn_add_file")
        self.horizontalLayout_2.addWidget(self.btn_add_file)
        # "Load pbtxt file" button
        self.btn_add_pbtxt = QtWidgets.QPushButton(self.frame)
        self.btn_add_pbtxt.setObjectName("btn_add_pbtxt")
        self.horizontalLayout_2.addWidget(self.btn_add_pbtxt)
        # "Enter number of classes" button
        self.btn_enter = QtWidgets.QPushButton(self.frame)
        self.btn_enter.setObjectName("btn_enter")
        self.horizontalLayout_2.addWidget(self.btn_enter)
        # "Open camera" button.  It used to share the object name
        # "btn_objdec" with the detection button; object names should be
        # unique within a form.
        self.btn_opencam = QtWidgets.QPushButton(self.frame)
        self.btn_opencam.setObjectName("btn_opencam")
        self.horizontalLayout_2.addWidget(self.btn_opencam)
        # "Start detection" button
        self.btn_objdec = QtWidgets.QPushButton(self.frame)
        self.btn_objdec.setObjectName("btn_objdec")
        self.horizontalLayout_2.addWidget(self.btn_objdec)
        # "Exit" button
        self.btn_exit = QtWidgets.QPushButton(self.frame)
        self.btn_exit.setObjectName("btn_exit")
        self.horizontalLayout_2.addWidget(self.btn_exit)
        # Label showing the raw camera frame
        self.lab_rawimg_show = QtWidgets.QLabel(Form)
        self.lab_rawimg_show.setGeometry(QtCore.QRect(20, 140, 260, 260))
        self.lab_rawimg_show.setMinimumSize(QtCore.QSize(260, 260))
        self.lab_rawimg_show.setMaximumSize(QtCore.QSize(260, 260))
        self.lab_rawimg_show.setObjectName("lab_rawimg_show")
        self.lab_rawimg_show.setStyleSheet(("border:2px solid red"))
        # Scale the pixmap to the label, exactly like the detection label
        # does, so both views show the frame with the same proportions.
        self.lab_rawimg_show.setScaledContents(True)

        # Label showing the annotated (detection result) frame
        self.lab_decimg_show = QtWidgets.QLabel(Form)
        self.lab_decimg_show.setGeometry(QtCore.QRect(300, 140, 260, 260))
        self.lab_decimg_show.setMinimumSize(QtCore.QSize(260, 260))
        self.lab_decimg_show.setMaximumSize(QtCore.QSize(260, 260))
        self.lab_decimg_show.setObjectName("lab_decimgimg_show")
        self.lab_decimg_show.setStyleSheet(("border:2px solid green"))

        self.retranslateUi(Form)
        # Connect each button's clicked signal to its slot.
        self.btn_add_file.clicked.connect(self.openpb)
        self.btn_add_pbtxt.clicked.connect(self.openpbtxt)
        self.btn_enter.clicked.connect(self.enter_num_cls)
        self.btn_opencam.clicked.connect(self.opencam)
        self.btn_objdec.clicked.connect(self.refresh_objdec)
        # The exit button simply closes the hosting form.
        self.btn_exit.clicked.connect(Form.close)
        QtCore.QMetaObject.connectSlotsByName(Form)

    def retranslateUi(self, Form):
        """Set the window title and every widget caption.

        All strings use the translation context "Form"; two of them used the
        misspelled context "From" before.
        """
        _translate = QtCore.QCoreApplication.translate
        Form.setWindowTitle(_translate("Form", "目標檢測"))
        self.btn_add_file.setText(_translate("Form", "載入模型檔案"))
        self.btn_add_pbtxt.setText(_translate("Form", "載入pbtxt檔案"))
        self.btn_enter.setText(_translate("Form", "指定識別類別數"))
        self.btn_opencam.setText(_translate("Form", "開啟攝像頭"))
        self.btn_objdec.setText(_translate("Form", "開始識別"))
        self.btn_exit.setText(_translate("Form", "退出"))
        self.lab_rawimg_show.setText(_translate("Form", "攝像頭原始畫面"))
        self.lab_decimg_show.setText(_translate("Form", "實時識別效果"))

    def openpb(self):
        """Ask for the frozen graph file and store its path in ``openfile_name_pb``.

        A cancelled dialog leaves a previously chosen path untouched.
        """
        global openfile_name_pb
        chosen, _ = QFileDialog.getOpenFileName(self.btn_add_file,'選擇pb檔案','/home/kanghao/','pb_files(*.pb)')
        if not chosen:
            return
        openfile_name_pb = chosen
        print('載入模型檔案地址為：' + str(openfile_name_pb))

    def openpbtxt(self):
        """Ask for the label map file and store its path in ``openfile_name_pbtxt``.

        A cancelled dialog leaves a previously chosen path untouched.
        """
        global openfile_name_pbtxt
        chosen, _ = QFileDialog.getOpenFileName(self.btn_add_pbtxt,'選擇pbtxt檔案','/home/kanghao/','pbtxt_files(*.pbtxt)')
        if not chosen:
            return
        openfile_name_pbtxt = chosen
        print('載入標籤檔案地址為：' + str(openfile_name_pbtxt))

    def opencam(self):
        """Open camera 0 and start the preview timer.

        Does nothing when the camera is already open, so clicking the button
        twice neither reopens the device nor creates a second timer.
        """
        capture = getattr(self, 'camcapture', None)
        if capture is not None and capture.isOpened():
            return
        self.camcapture = cv2.VideoCapture(0)
        if not self.camcapture.isOpened():
            print('無法開啟攝像頭')
            return
        self.timer = QtCore.QTimer()
        # Configure the timer completely before starting it.
        self.timer.setInterval(self.CAM_INTERVAL_MS)
        self.timer.timeout.connect(self.camshow)
        self.timer.start()

    def camshow(self):
        """Grab one frame, publish it as the global ``camimg`` and display it.

        The frame is stored in RGB channel order.  When the grab fails the
        previous frame and the previous preview are kept.
        """
        global camimg
        grabbed, frame = self.camcapture.read()
        if not grabbed or frame is None:
            return
        frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        camimg = frame
        height, width = frame.shape[:2]
        # Pass the row stride explicitly: without it QImage assumes rows
        # padded to 4 bytes, which does not hold for every frame width.
        showImage = QtGui.QImage(frame.data, width, height, frame.strides[0], QtGui.QImage.Format_RGB888)
        self.lab_rawimg_show.setPixmap(QtGui.QPixmap.fromImage(showImage))

    def enter_num_cls(self):
        """Ask for the number of classes and store it in the global ``num_class``.

        The global is only updated when the dialog is confirmed.
        """
        global num_class
        value, okPressed = QInputDialog.getInt(self.btn_enter,'指定訓練類別數','你的目標有多少類？',1,1,28,1)
        if okPressed:
            num_class = value
            print('識別目標總類為：' + str(num_class))

    @staticmethod
    def _rgb_to_bgrx(image):
        """Return a C-contiguous (H, W, 4) uint8 copy of an RGB image.

        Channels 0..2 of the result are the input channels in reversed order
        and channel 3 is filled with 255.
        """
        height, width = image.shape[:2]
        bgrx = np.empty((height, width, 4), dtype=np.uint8, order='C')
        bgrx[..., 0] = image[..., 2]
        bgrx[..., 1] = image[..., 1]
        bgrx[..., 2] = image[..., 0]
        # Qt documents Format_RGB32 as 0xffRRGGBB, so the fourth byte must be
        # 0xff rather than left at zero.
        bgrx[..., 3] = 255
        return bgrx

    def img2pixmap(self, image):
        """Convert an (H, W, 3) RGB array into a QPixmap.

        Args:
            image: numpy array whose last axis holds R, G, B.

        Returns:
            A QPixmap with the same width and height as ``image``.
        """
        # Keep the buffer on the instance so it outlives the QImage built on it.
        self._bgra = self._rgb_to_bgrx(image)
        height, width = self._bgra.shape[:2]
        qimage = QtGui.QImage(self._bgra.data, width, height, self._bgra.strides[0], QtGui.QImage.Format_RGB32)
        return QtGui.QPixmap.fromImage(qimage)

    @staticmethod
    def _detection_inputs():
        """Return ``(pb_path, pbtxt_path, frame)`` or None if any is missing.

        The values are read from the module globals written by ``openpb``,
        ``openpbtxt`` and ``camshow``; a global that was never assigned counts
        as missing instead of raising NameError.
        """
        state = globals()
        pb_path = state.get('openfile_name_pb')
        pbtxt_path = state.get('openfile_name_pbtxt')
        frame = state.get('camimg')
        if not pb_path or not pbtxt_path or frame is None:
            return None
        return pb_path, pbtxt_path, frame

    def refresh_objdec(self):
        """Start the timer that runs ``object_detection`` periodically.

        Nothing is started while the model file, the label map or a camera
        frame is still missing, or when the timer is already running.
        """
        running = getattr(self, 'timerdec', None)
        if running is not None and running.isActive():
            return
        if self._detection_inputs() is None:
            print('請先載入模型檔案和pbtxt檔案，並開啟攝像頭')
            return
        self.timerdec = QtCore.QTimer()
        # Configure the timer completely before starting it.
        self.timerdec.setInterval(self.DETECT_INTERVAL_MS)
        self.timerdec.timeout.connect(self.object_detection)
        self.timerdec.start()

    def _get_detector(self, pb_path, pbtxt_path, frame_size):
        """Return the cached detector, building it on first use.

        The frozen graph, the label map, the output tensor handles and the
        TensorFlow session are created once and reused for every frame.  They
        are rebuilt only when one of the paths or the frame size changes (the
        mask-reframing ops are built for a fixed frame size).

        Args:
            pb_path: path of the frozen detection graph.
            pbtxt_path: path of the label map.
            frame_size: ``(height, width)`` of the frames to be processed.

        Returns:
            dict with the keys ``key``, ``session``, ``tensor_dict``,
            ``image_tensor``, ``category_index`` and ``vis_util``.

        Raises:
            ImportError: if the installed TensorFlow is older than 1.9.0 or
                the object-detection utility modules cannot be imported.
        """
        cache_key = (pb_path, pbtxt_path, tuple(frame_size))
        cached = getattr(self, '_detector', None)
        if cached is not None and cached['key'] == cache_key:
            return cached
        if cached is not None:
            # Inputs changed: release the old session before rebuilding.
            cached['session'].close()
            self._detector = None

        # Extend the import path once instead of on every timer tick.
        if ".." not in sys.path:
            sys.path.append("..")
        from object_detection.utils import ops as utils_ops

        if StrictVersion(tf.__version__) < StrictVersion('1.9.0'):
            raise ImportError('Please upgrade your TensorFlow installation to v1.9.* or later!')

        from utils import label_map_util
        from utils import visualization_utils as vis_util

        detection_graph = tf.Graph()
        with detection_graph.as_default():
            od_graph_def = tf.GraphDef()
            with tf.gfile.GFile(pb_path, 'rb') as fid:
                od_graph_def.ParseFromString(fid.read())
            tf.import_graph_def(od_graph_def, name='')

            # Collect handles to whichever output tensors the graph provides.
            all_tensor_names = {
                output.name
                for op in detection_graph.get_operations()
                for output in op.outputs
            }
            tensor_dict = {}
            for output_key in [
                'num_detections', 'detection_boxes', 'detection_scores',
                'detection_classes', 'detection_masks'
            ]:
                tensor_name = output_key + ':0'
                if tensor_name in all_tensor_names:
                    tensor_dict[output_key] = detection_graph.get_tensor_by_name(tensor_name)
            if 'detection_masks' in tensor_dict:
                # The following processing is only for a single image.
                detection_boxes = tf.squeeze(tensor_dict['detection_boxes'], [0])
                detection_masks = tf.squeeze(tensor_dict['detection_masks'], [0])
                # Reframe is required to translate masks from box coordinates
                # to image coordinates and fit the image size.
                real_num_detection = tf.cast(tensor_dict['num_detections'][0], tf.int32)
                detection_boxes = tf.slice(detection_boxes, [0, 0], [real_num_detection, -1])
                detection_masks = tf.slice(detection_masks, [0, 0, 0], [real_num_detection, -1, -1])
                detection_masks_reframed = utils_ops.reframe_box_masks_to_image_masks(
                    detection_masks, detection_boxes, frame_size[0], frame_size[1])
                detection_masks_reframed = tf.cast(
                    tf.greater(detection_masks_reframed, 0.5), tf.uint8)
                # Follow the convention by adding back the batch dimension.
                tensor_dict['detection_masks'] = tf.expand_dims(
                    detection_masks_reframed, 0)
            image_tensor = detection_graph.get_tensor_by_name('image_tensor:0')

        category_index = label_map_util.create_category_index_from_labelmap(pbtxt_path, use_display_name=True)

        # Create the session last so nothing has to be cleaned up when one of
        # the steps above fails.
        self._detector = {
            'key': cache_key,
            'session': tf.Session(graph=detection_graph),
            'tensor_dict': tensor_dict,
            'image_tensor': image_tensor,
            'category_index': category_index,
            'vis_util': vis_util,
        }
        return self._detector

    @staticmethod
    def _run_inference(detector, image):
        """Run the cached session on one image and unbatch the outputs.

        Args:
            detector: dict returned by ``_get_detector``.
            image: (H, W, 3) array; a batch axis is added before feeding.

        Returns:
            dict with ``num_detections`` (int), ``detection_classes``,
            ``detection_boxes``, ``detection_scores`` and, when the graph
            provides it, ``detection_masks`` for the single input image.
        """
        output_dict = detector['session'].run(
            detector['tensor_dict'],
            feed_dict={detector['image_tensor']: np.expand_dims(image, 0)})

        # All outputs come back batched; keep the entry of the single image
        # and convert types as appropriate.
        output_dict['num_detections'] = int(output_dict['num_detections'][0])
        output_dict['detection_classes'] = output_dict[
            'detection_classes'][0].astype(np.int64)
        output_dict['detection_boxes'] = output_dict['detection_boxes'][0]
        output_dict['detection_scores'] = output_dict['detection_scores'][0]
        if 'detection_masks' in output_dict:
            output_dict['detection_masks'] = output_dict['detection_masks'][0]
        return output_dict

    def object_detection(self):
        """Detect objects in the latest camera frame and show the result.

        Returns without doing anything while the model file, the label map or
        a camera frame is missing.  If the detector cannot be built, the
        detection timer is stopped and the error is re-raised, so the failure
        is reported once instead of on every tick.
        """
        inputs = self._detection_inputs()
        if inputs is None:
            return
        pb_path, pbtxt_path, frame = inputs

        # Draw on a private copy so the shared camera frame stays clean.
        image_np = frame.copy()

        try:
            detector = self._get_detector(pb_path, pbtxt_path, image_np.shape[:2])
        except Exception:
            timer = getattr(self, 'timerdec', None)
            if timer is not None:
                timer.stop()
            raise

        output_dict = self._run_inference(detector, image_np)
        # Draw boxes, labels and (if present) masks onto the copy.
        detector['vis_util'].visualize_boxes_and_labels_on_image_array(
            image_np,
            output_dict['detection_boxes'],
            output_dict['detection_classes'],
            output_dict['detection_scores'],
            detector['category_index'],
            instance_masks=output_dict.get('detection_masks'),
            use_normalized_coordinates=True,
            line_thickness=8)
        self.lab_decimg_show.setPixmap(self.img2pixmap(image_np))
        self.lab_decimg_show.setScaledContents(True)

## Script entry point: build the window and run the Qt event loop
if __name__ == "__main__":
    qt_app = QtWidgets.QApplication(sys.argv)
    main_window = QtWidgets.QWidget()
    # form is an instance of UiForm that populates the bare widget
    form = UiForm()
    form.setupUi(main_window)
    main_window.show()
    # Block in the event loop and hand its return code to the interpreter.
    exit_code = qt_app.exec_()
    sys.exit(exit_code)

【學習筆記】pyQt5學習筆記(4）——第一個影象識別demoV3.0B

軟體更新日誌V3.0B版本，在2.0基礎上實現了呼叫攝像頭的實時識別功能。V3.0A版若不實時重新整理識別畫面，可以手動點一次識別一次…… 附上完整程式碼，也是做個程式碼備份。需要的小夥伴自取就ok～軟體目前存在的bug是1.在開始識別後會很卡，目前認為可能的原因是每次重新整理

【學習筆記】pyQt5學習筆記(7）——RecursionError: maximum recursion depth exceeded錯誤

同樣的程式，在Ubuntu系統下使用pyinstaller打包沒有問題，在win10下打包提示： RecursionError: maximum recursion depth exceeded 找到的解決方法在這裡，在spec檔案開頭（除了第一行的註釋）新增如下語句： import s

【學習筆記】pyQt5學習筆記(6）——Google object detection API訓練&識別用軟體更新

對訓練軟體和識別軟體均再一次進行更新。針對訓練用軟體，V1.0版本是通過下拉框選擇標註物體的標籤，而下拉框中是我預定義的a~f 6個標籤。因此存在的問題就是標籤不能客製化，且若標記超過6類物體標籤數量不夠。針對這個問題進行了更新，現在允許使用者自己輸入標籤名稱，標籤會儲存在下拉選單中，媽媽再

【學習筆記】pyQt5學習筆記(5）——Google object detection API訓練用軟體

之前的學習筆記是呼叫訓練好的結果來做識別，分為載入本地圖片識別和呼叫usb攝像頭實時識別（IP攝像頭暫時不可用）；但是首先有了訓練才能有訓練好的模型檔案供我們使用。加之訓練過程比較複雜，呼叫多個指令碼，上手不便；製作訓練用的軟體一方面是方便自己使用，另一方面也對自己是個鍛鍊。軟體最終的介面如下圖所示

【學習筆記】pyQt5學習筆記(1）

著手學習pyQt5，今天實現功能，讀取圖片，自適應label的大小並顯示在介面上。個人理解，pyQt5前端用QT designer設計簡單的ui介面，初步規劃除介面佈局及元件，儲存為ui檔案後，通過命令： pyuic5 -o xxxx.py xxxx.ui 將designer生成的ui

【學習筆記】pyQt5學習筆記（8）——windows下pyinstaller打包程式不能訪問ip攝像頭

我的程式需要使用RTSP來訪問IP攝像頭，明明在IDE中執行指令碼沒問題，可是打包之後就無法連線攝像頭，程式出現沒有響應。看到這個博主說的方法，嘗試了一下果然解決了。使用方法：將opencv_ffmpeg345_64.dll拷貝到欲打包的目錄下，然後使用命令： pyinstaller

Turbo51學習筆記（4）第一個程式

在高階語言裡，“Hello world"是經典的第一個程式；在與硬體密切相關的嵌入式程式設計裡，點亮LED燈則更具有代表性。下面的程式碼實現一個LED燈的明、暗迴圈： Program led_test; const flash_time_limit_1=$A0;

【星雲測試】開發者測試（4）-采用精準測試工具對dubbo微服務應用進行測試

星雲測試 term 重命名 text gen 計算方法 url 生產者和消費者 local 簡介：本文主要目的是把現今主流的Dubbo框架項目和精準測試進行對接，通過精準測試的數據穿透、數據采集、測試用例與代碼的雙向追溯、數據分析等一系列精準測試的特有功能達到對項目質量的保

【軟考】——面向物件（4）

Diagram VS Diagram Sequence Diagram VS Collaboration diagram？？？——》同點：在語義上等價，可以相互轉化；？？？——》都是互動

【leetcode 簡單】第七十五題第一個錯誤的版本

nbsp 團隊 logs span 通過 bad log 是否判斷你是產品經理，目前正在帶領一個團隊開發新的產品。不幸的是，你的產品的最新版本沒有通過質量檢測。由於每個版本都是基於之前的版本開發的，所以錯誤的版本之後的所有版本都是錯的。假設你有 n 個版本 [1,

HDU 1711 Number Sequence【KMP】【模板題】【水題】（返回匹配到的第一個字母的位置）

Number Sequence Time Limit: 10000/5000 MS (Java/Others) Memory Limit: 32768/32768 K (Java/Others) Total Submission(s): 29634 Acce

【劍指】面試題50 字串中第一個只出現一次的字元

演算法思想我們可以考慮實現一個簡單的雜湊表，字元是一個長度為8的資料型別，因此共有256中可能。於是我們建立一個長度為256的陣列，每個字母根據其ASCII嗎值作為陣列的下標對應陣列的

【JAVAWEB學習筆記】網上商城實戰4：訂單模塊

接收筆記網上商城詳情 src head 分頁查詢 cnblogs logs 今日任務完成訂單模塊的功能 1.1 訂單模塊的功能 1.1.1 我的訂單：【我的訂單的查詢】 * 在header.jsp中點擊我的訂單. * 提交到Servlet:

【svm學習筆記】svm_理論基礎4

【線性不可分問題之核函式】上面討論的都是線性可分問題，雖然最終也沒看到解的樣子或者解的方法，總之，我們假設已經可以解了。接下來，如果樣本線性不可分，咋整？好辦。記得從前影象處理裡面有個小波變換，大概的意思就是時域效果不好的話，變換到復域效果就好了，變換的名稱我記

【學習筆記】統計學入門（4/7）——正態分佈

來源：http://study.163.com/course/courseMain.htm?courseId=1005232026 索引—— 基本概念連續變數的統計描述分類變數的統計描述正態分佈二項分佈引數估計與可信區間假設檢驗四、正

【安全牛學習筆記】Web掃描器（1）

安全 web 漏洞 1.偵察httrack可將目標網站的網頁全部爬取下來,減少偵察過程中與目標服務器發生的交互。 2.Nikto(1).檢測對象掃描軟件版本搜索存在安全隱患的文件配置漏洞

【K8S學習筆記】Part3：同一Pod中多個容器間使用共享卷進行通信

ash source net def exe tput stat policy container 本文將展示如何使用共享卷（Volume）來實現相同Pod中的兩個容器間通信。註意：本文針對K8S的版本號為v1.9，其他版本可能會有少許不同。 0x00 準備工作需要有一

【Apache Kafka】Kafka學習筆記

local ets prop strong 當前 text 生產 create topic 0x00 基本信息 1、Kafka架構圖 2、環境信息服務器IP：xx.xx.xx.xx 操作系統：CentOS7.2_x64 Kafka版本：kafka_2.12-1.1

【Redis資料庫】命令學習筆記——釋出訂閱、事務、指令碼、連線命令彙總

本篇基於redis 4.0.11版本，學習釋出訂閱、事務、指令碼、連線的相關命令。 Redis 釋出訂閱(pub/sub)是一種訊息通訊模式：傳送者(pub)傳送訊息，訂閱者(sub)接收訊息。序

【學習筆記】前端學習筆記 HTML+CSS+JavaScript+JQuery

學這些太痛苦了，我一定要成為演算法工程師！ HTML 簡介 Hyper Text Mark Language，超文字標記語言，使用一套標記標籤來描述網頁。標籤，開始標籤，結束標籤，標籤內容，屬性。開始標籤後加/來結束，如<br/>。推薦使用小寫。

【學習筆記】pyQt5學習筆記(4）——第一個影象識別demoV3.0B

相關推薦