日常摸鱼系列

程序员文章站 2022-04-21 10:38:02

把别人训练好的yolo3模型的权重，调过来看看import numpy as npimport cv2 as cvimport osimport timepath = 'D:/Code/Python/YOLO3'weightsPath = os.path.join(path, 'yolov3.weights') # 权重文件configPath = os.path.join(path, 'yolov3.cfg') # 配置文件labelsPath = os.path.join(path...

把别人训练好的yolo3模型的权重，调过来看看

import numpy as np
import cv2 as cv
import os
import time

path = 'D:/Code/Python/YOLO3'
weightsPath = os.path.join(path, 'yolov3.weights')  # 权重文件
configPath = os.path.join(path, 'yolov3.cfg')  # 配置文件
labelsPath = os.path.join(path, 'coco.names')  # label名称
imgPath = os.path.join(path, 'dog.jpg')  # 测试图像
CONFIDENCE = 0.5  # 过滤弱检测的最小概率
THRESHOLD = 0.4  # 非最大值抑制阈值
# 加载网络、配置权重
net = cv.dnn.readNetFromDarknet(configPath, weightsPath)  # #  利用下载的文件
print("[INFO] loading YOLO from disk...")  # # 可以打印下信息
#打开摄像头，读取视频
cv.namedWindow("Photo_Detect")  #定义一个窗口
video=cv.VideoCapture(0) #捕获摄像头图像  0位默认的摄像头 笔记本的自带摄像头  1为外界摄像头
def object_dect(img):
    blobImg = cv.dnn.blobFromImage(img, 1.0 / 255.0, (416, 416), None, True,False)  # # net需要的输入是blob格式的，用blobFromImage这个函数来转格式
    net.setInput(blobImg)  # # 调用setInput函数将图片送入输入层
    # 获取网络输出层信息（所有输出层的名字），设定并前向传播
    outInfo = net.getUnconnectedOutLayersNames()  # # 前面的yolov3架构也讲了，yolo在每个scale都有输出，outInfo是每个scale的名字信息，供net.forward使用
    layerOutputs = net.forward(outInfo)  # 得到各个输出层的、各个检测框等信息，是二维结构。
    (H, W) = img.shape[:2]
    boxes = []  # 所有边界框（各层结果放一起）
    confidences = []  # 所有置信度
    classIDs = []  # 所有分类ID
    for out in layerOutputs:  # 各个输出层
        for detection in out:  # 各个框框
            # 拿到置信度
            scores = detection[5:]  # 各个类别的置信度
            classID = np.argmax(scores)  # 最高置信度的id即为分类id
            confidence = scores[classID]  # 拿到置信度
            # 根据置信度筛查
            if confidence > CONFIDENCE:
                box = detection[0:4] * np.array([W, H, W, H])  # 将边界框放会图片尺寸
                (centerX, centerY, width, height) = box.astype("int")
                x = int(centerX - (width / 2))
                y = int(centerY - (height / 2))
                boxes.append([x, y, int(width), int(height)])
                confidences.append(float(confidence))
                classIDs.append(classID)
    # # 2）应用非最大值抑制(non-maxima suppression，nms)进一步筛掉
    idxs = cv.dnn.NMSBoxes(boxes, confidences, CONFIDENCE, THRESHOLD)  # boxes中，保留的box的索引index存入idxs
    # 得到labels列表
    with open(labelsPath, 'rt') as f:
        labels = f.read().rstrip('\n').split('\n')
    # 应用检测结果
    np.random.seed(42)
    COLORS = np.random.randint(0, 255, size=(len(labels), 3),dtype="uint8")  # 框框显示颜色，每一类有不同的颜色，每种颜色都是由RGB三个值组成的，所以size为(len(labels), 3)
    if len(idxs) > 0:
        for i in idxs.flatten():  # indxs是二维的，第0维是输出层，所以这里把它展平成1维
            (x, y) = (boxes[i][0], boxes[i][1])
            (w, h) = (boxes[i][2], boxes[i][3])
            color = [int(c) for c in COLORS[classIDs[i]]]
            cv.rectangle(img, (x, y), (x + w, y + h), color, 2)  # 线条粗细为2px
            text = "{}: {:.4f}".format(labels[classIDs[i]], confidences[i])
            cv.putText(img, text, (x, y - 5), cv.FONT_HERSHEY_SIMPLEX, 0.5, color,2)  # cv.FONT_HERSHEY_SIMPLEX字体风格、0.5字体大小、粗细2px
            cv.imshow('detected image', img)
#循环摄像头的视频
while(True):                  #值为1不断读取图像
    ret, img = video.read()  #视频捕获帧
    object_dect(img)
    if cv.waitKey(1) & 0xFF == ord('Q'):   #按Q关闭所有窗口  一次没反应的话就多按几下
        break
#执行完后释放窗口
video.release()  # 释放捕获
cv.destroyAllWindows()  # 摧毁全部窗体

本文地址：https://blog.csdn.net/LJP1924804579/article/details/109614979

日常摸鱼系列

FIF互动帮助手册系列－HTML手册 flash版

WPF之图片处理系列

谷歌Pixel 3系列手机新壁纸曝光将在10月9日于美国和欧洲发布

sql server 备份与恢复系列六文件组备份与还原

MySQL OOM 系列一 Linux内存分配

Mysql精粹系列(精粹)

iOS开发系列--详细介绍数据存取

浅谈Java设计模式系列-装饰器模式

详解Mysql中的JSON系列操作函数

iOS开发系列--详细讲解C语言之存储方式和作用域

日常摸鱼系列

FIF互动帮助手册系列－HTML手册 flash版

WPF之图片处理系列

谷歌Pixel 3系列手机新壁纸曝光 将在10月9日于美国和欧洲发布

sql server 备份与恢复系列六 文件组备份与还原

MySQL OOM 系列一 Linux内存分配

Mysql精粹系列(精粹)

iOS开发系列--详细介绍数据存取

浅谈Java设计模式系列-装饰器模式

详解Mysql中的JSON系列操作函数

iOS开发系列--详细讲解C语言之存储方式和作用域

谷歌Pixel 3系列手机新壁纸曝光将在10月9日于美国和欧洲发布

sql server 备份与恢复系列六文件组备份与还原