基于yolov5的mjpg-streamer服务器搭建

2023年7月20日下午12:02 • 人工智能 • 阅读 76

前言：使用 onnxruntime 加载 YOLOv5 的 ONNX 模型，并基于 Python 自带的 http.server 搭建 mjpg-streamer 服务器；用 OpenCV 打开电脑摄像头或 RTSP 流，完成目标检测后将结果帧推送到 mjpg-streamer，即可通过浏览器实时观看检测后的视频流。

一、使用python版本的onnxruntime 加载yolov5模型

import cv2
import numpy as np
import onnxruntime as ort

class yolov5:
    """YOLOv5 detector that runs an ONNX model through onnxruntime.

    Class names are read from ``class.names`` in the current working
    directory (one name per line).  The network input is square: 1280x1280
    with four detection scales when the model file name ends in ``6.onnx``,
    otherwise 640x640 with three scales.
    """

    def __init__(self, modelpath, confThreshold=0.5, nmsThreshold=0.5, objThreshold=0.5):
        """Load the class names and create the inference session.

        Args:
            modelpath: Path to the ``.onnx`` model file.
            confThreshold: Minimum (class score * objectness) to keep a box.
            nmsThreshold: Overlap threshold passed to ``cv2.dnn.NMSBoxes``.
            objThreshold: Minimum objectness for a candidate to be considered.
        """
        with open('class.names', 'rt') as f:
            self.classes = f.read().rstrip('\n').split('\n')
        self.num_classes = len(self.classes)
        if modelpath.endswith('6.onnx'):
            self.inpHeight, self.inpWidth = 1280, 1280
            anchors = [[19, 27, 44, 40, 38, 94], [96, 68, 86, 152, 180, 137], [140, 301, 303, 264, 238, 542], [436, 615, 739, 380, 925, 792]]
            self.stride = np.array([8., 16., 32., 64.])
        else:
            self.inpHeight, self.inpWidth = 640, 640
            anchors = [[10, 13, 16, 30, 33, 23], [30, 61, 62, 45, 59, 119], [116, 90, 156, 198, 373, 326]]
            self.stride = np.array([8., 16., 32.])
        self.nl = len(anchors)  # number of detection scales
        self.na = len(anchors[0]) // 2  # anchors per scale (each anchor is a w,h pair)
        self.grid = [np.zeros(1)] * self.nl
        # (h, w) each cached grid was built for; None until the first detect().
        self._grid_shape = [None] * self.nl
        self.anchor_grid = np.asarray(anchors, dtype=np.float32).reshape(self.nl, -1, 2)
        so = ort.SessionOptions()
        so.log_severity_level = 3
        self.net = ort.InferenceSession(modelpath, so)
        self.confThreshold = confThreshold
        self.nmsThreshold = nmsThreshold
        self.objThreshold = objThreshold

    def resize_image(self, srcimg, keep_ratio=True):
        """Resize ``srcimg`` to the network input size.

        With ``keep_ratio`` the aspect ratio is preserved and the shorter side
        is padded symmetrically with grey (114, 114, 114); this letterboxing
        relies on the network input being square.

        Returns:
            ``(img, newh, neww, top, left)``: the resized image, the size of
            the un-padded image content, and the top/left padding in pixels.
        """
        # Fixed: height/width were assigned in swapped order here.
        top, left, newh, neww = 0, 0, self.inpHeight, self.inpWidth
        if keep_ratio and srcimg.shape[0] != srcimg.shape[1]:
            hw_scale = srcimg.shape[0] / srcimg.shape[1]
            if hw_scale > 1:
                # Portrait image: fill the height, pad left and right.
                newh, neww = self.inpHeight, int(self.inpWidth / hw_scale)
                img = cv2.resize(srcimg, (neww, newh), interpolation=cv2.INTER_AREA)
                left = int((self.inpWidth - neww) * 0.5)
                img = cv2.copyMakeBorder(img, 0, 0, left, self.inpWidth - neww - left, cv2.BORDER_CONSTANT,
                                         value=(114, 114, 114))  # add border
            else:
                # Landscape image: fill the width, pad top and bottom.
                newh, neww = int(self.inpHeight * hw_scale), self.inpWidth
                img = cv2.resize(srcimg, (neww, newh), interpolation=cv2.INTER_AREA)
                top = int((self.inpHeight - newh) * 0.5)
                img = cv2.copyMakeBorder(img, top, self.inpHeight - newh - top, 0, 0, cv2.BORDER_CONSTANT,
                                         value=(114, 114, 114))
        else:
            img = cv2.resize(srcimg, (self.inpWidth, self.inpHeight), interpolation=cv2.INTER_AREA)
        return img, newh, neww, top, left

    def _make_grid(self, nx=20, ny=20):
        """Return the (x, y) cell offsets of an ``nx`` wide, ``ny`` tall grid.

        The result is a float32 array of shape ``(ny * nx, 2)`` in row-major
        order, i.e. row ``y * nx + x`` holds ``(x, y)``.
        """
        # Fixed: the arguments were swapped, which is only correct when nx == ny.
        xv, yv = np.meshgrid(np.arange(nx), np.arange(ny))
        return np.stack((xv, yv), 2).reshape((-1, 2)).astype(np.float32)

    def preprocess(self, img):
        """Convert a BGR uint8 image to RGB float32 scaled to [0, 1]."""
        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        img = img.astype(np.float32) / 255.0
        return img

    def postprocess(self, frame, outs, padsize=None):
        """Filter decoded predictions, run NMS and draw the survivors on ``frame``.

        Args:
            frame: Original image; boxes are drawn on it in place.
            outs: 2-D array, one row per candidate:
                ``[cx, cy, w, h, objectness, class scores...]`` in network
                input pixels.
            padsize: ``(newh, neww, padh, padw)`` as returned by
                ``resize_image``; required despite the ``None`` default.

        Returns:
            ``frame`` with the detections drawn.
        """
        frameHeight = frame.shape[0]
        frameWidth = frame.shape[1]
        newh, neww, padh, padw = padsize
        # Scale factors from the letterboxed content back to the original frame.
        ratioh, ratiow = frameHeight / newh, frameWidth / neww

        # Keep only candidates with high objectness and class confidence; the
        # label is the class with the highest score.
        confidences = []
        boxes = []
        classIds = []
        for detection in outs:
            if detection[4] > self.objThreshold:
                scores = detection[5:]
                classId = np.argmax(scores)
                confidence = scores[classId] * detection[4]
                if confidence > self.confThreshold:
                    center_x = int((detection[0] - padw) * ratiow)
                    center_y = int((detection[1] - padh) * ratioh)
                    width = int(detection[2] * ratiow)
                    height = int(detection[3] * ratioh)
                    left = int(center_x - width * 0.5)
                    top = int(center_y - height * 0.5)

                    confidences.append(float(confidence))
                    boxes.append([left, top, width, height])
                    classIds.append(classId)

        # Non-maximum suppression removes redundant overlapping boxes.
        indices = cv2.dnn.NMSBoxes(boxes, confidences, self.confThreshold, self.nmsThreshold)
        # Depending on the OpenCV version the result is a flat array, an Nx1
        # array, or an empty tuple; normalise to a flat integer array.
        for i in np.asarray(indices, dtype=int).reshape(-1):
            left, top, width, height = boxes[i]
            frame = self.drawPred(frame, classIds[i], confidences[i], left, top, left + width, top + height)
        return frame

    def drawPred(self, frame, classId, conf, left, top, right, bottom):
        """Draw one bounding box and its ``class:confidence`` label on ``frame``."""
        font, font_scale, text_thickness = cv2.FONT_HERSHEY_SIMPLEX, 1, 2

        cv2.rectangle(frame, (left, top), (right, bottom), (255, 0, 0), thickness=4)

        label = '%s:%.2f' % (self.classes[classId], conf)

        # Measure the label with the same font settings used to draw it, and
        # keep its baseline far enough down that the text stays inside the frame.
        labelSize, baseLine = cv2.getTextSize(label, font, font_scale, text_thickness)
        text_y = max(top - 10, labelSize[1])
        cv2.putText(frame, label, (left, text_y), font, font_scale, (0, 255, 0), thickness=text_thickness)
        return frame

    def detect(self, srcimg):
        """Run detection on a BGR image and return it with the boxes drawn.

        Args:
            srcimg: BGR image (``preprocess`` converts it to RGB itself).

        Returns:
            ``srcimg`` annotated in place with the detected boxes.
        """
        img, newh, neww, padh, padw = self.resize_image(srcimg)
        img = self.preprocess(img)
        # HWC -> NCHW with a batch dimension of one.
        blob = np.expand_dims(np.transpose(img, (2, 0, 1)), axis=0)

        outs = self.net.run(None, {self.net.get_inputs()[0].name: blob})[0].squeeze(axis=0)

        # Decode the raw predictions scale by scale.  Rows are consumed in the
        # order scale -> anchor -> grid cell, matching the tile/repeat below.
        row_ind = 0
        for i in range(self.nl):
            h, w = int(img.shape[0] / self.stride[i]), int(img.shape[1] / self.stride[i])
            length = int(self.na * h * w)
            # Build the grid once per scale; the old shape[2:4] check never
            # matched a 2-D grid, so it was rebuilt on every frame.
            if self._grid_shape[i] != (h, w):
                self.grid[i] = self._make_grid(w, h)
                self._grid_shape[i] = (h, w)

            rows = slice(row_ind, row_ind + length)
            # Box centre: offset within the cell plus the cell index, in input pixels.
            outs[rows, 0:2] = (outs[rows, 0:2] * 2. - 0.5 + np.tile(
                self.grid[i], (self.na, 1))) * int(self.stride[i])
            # Box size: scaled anchor dimensions.
            outs[rows, 2:4] = (outs[rows, 2:4] * 2) ** 2 * np.repeat(
                self.anchor_grid[i], h * w, axis=0)
            row_ind += length
        srcimg = self.postprocess(srcimg, outs, padsize=(newh, neww, padh, padw))
        return srcimg

二、基于http.server搭建mjpg-streamer服务器

import logging
import socketserver
from threading import Condition, Thread
from PIL import Image
import cv2
import traceback
import io
import time
from http.server import BaseHTTPRequestHandler, HTTPServer
from yolo import yolov5
import threading

class StreamingOutput:
    """Holds the most recent frame and wakes waiting threads when it changes."""

    def __init__(self):
        # Condition that consumers wait on until a new frame is written.
        self.condition = Condition()
        # Latest frame handed to write(); None until the first write.
        self.frame = None

    def write(self, frame):
        """Store ``frame`` as the latest frame and notify every waiting thread."""
        cond = self.condition
        cond.acquire()
        try:
            self.frame = frame
            cond.notify_all()
        finally:
            cond.release()

class StreamingHandler(BaseHTTPRequestHandler):
    """Serves the frames published on the module-level ``output`` as an MJPEG stream."""

    def do_GET(self):
        """Stream frames for ``/stream.mjpg``; answer 404 for any other path.

        The stream is a ``multipart/x-mixed-replace`` response in which every
        part is one JPEG frame.  The loop runs until writing to the client
        fails, which is logged as the client being removed.
        """
        # To serve the stream under a different URL, change the path compared
        # here; the default is http://ip:8000/stream.mjpg
        if self.path == '/stream.mjpg':
            self.send_response(200)
            self.send_header('Age', 0)
            self.send_header('Cache-Control', 'no-cache, private')
            self.send_header('Pragma', 'no-cache')
            self.send_header('Content-Type', 'multipart/x-mixed-replace; boundary=FRAME')
            self.end_headers()
            try:
                while True:
                    # Block until the producer publishes a new frame.
                    with output.condition:
                        output.condition.wait()
                        frame = output.frame
                    # One multipart part: boundary, part headers, JPEG bytes.
                    self.wfile.write(b'--FRAME\r\n')
                    self.send_header('Content-Type', 'image/jpeg')
                    self.send_header('Content-Length', len(frame))
                    self.end_headers()
                    self.wfile.write(frame)
                    self.wfile.write(b'\r\n')
            except Exception as e:
                traceback.print_exc()
                logging.warning(
                    'Removed streaming client %s: %s',
                    self.client_address, str(e))
        else:
            # send_error() already sends the headers and the error body; an
            # extra end_headers() here would append a stray CRLF after the
            # body and contradict its Content-Length.
            self.send_error(404)

class StreamingServer(socketserver.ThreadingMixIn, HTTPServer):
    """HTTPServer combined with ThreadingMixIn so requests are handled in threads."""

    # Handler threads are daemon threads.
    daemon_threads = True
    # Allow the listening address to be reused.
    allow_reuse_address = True

class Camera:
    """Context manager that captures frames, runs YOLOv5 on them and publishes JPEGs.

    Entering the context opens the video source and starts a background
    thread running ``capture``; leaving it stops the thread and releases the
    source.
    """

    def __init__(self, output, width, height, framerate, url):
        """Store the capture settings.

        Args:
            output: Object whose ``write(bytes)`` receives each encoded frame.
            width: Requested capture width in pixels.
            height: Requested capture height in pixels.
            framerate: Upper bound on processed frames per second.
            url: Source passed to ``cv2.VideoCapture``.
        """
        self.output = output
        self.width = width
        self.height = height
        self.framerate = framerate
        self.url = url

    def __enter__(self):
        # Camera index or RTSP stream URL; 0 opens the laptop's built-in camera.
        self.cap = cv2.VideoCapture(self.url)
        self.cap.set(cv2.CAP_PROP_FRAME_WIDTH, self.width)
        self.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, self.height)
        self.stop_capture = False
        self.thread = Thread(target=self.capture)
        self.thread.start()
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        # Ask the capture loop to finish, wait for it, then free the device.
        self.stop_capture = True
        self.thread.join()
        self.cap.release()

    def getIniVal(self, secname, keyname, defVal='', inifile='.\\para.ini'):
        """Read ``keyname`` from section ``[secname]`` of an INI-style file.

        Only lines inside the requested section are considered, and the key
        must match the whole text before the first ``=`` (ignoring
        surrounding whitespace).

        Args:
            secname: Section name without the brackets.
            keyname: Key to look up.
            defVal: Value returned when the section or key is not found.
            inifile: Path of the file to read.

        Returns:
            The stripped value as a string, or ``defVal``.

        Raises:
            OSError: If ``inifile`` cannot be opened.
        """
        header = '[' + secname + ']'
        in_section = False
        # The context manager closes the file on every exit path.
        with open(inifile, 'r', errors='ignore') as fh:
            for raw in fh:
                line = raw.strip()
                if line.startswith('['):
                    # Any section header starts or ends the requested section.
                    in_section = line.startswith(header)
                    continue
                if not in_section:
                    continue
                key, sep, value = line.partition('=')
                if sep and key.strip() == keyname:
                    return value.strip()
        return defVal

    def capture(self):
        """Capture loop run on the background thread until ``stop_capture`` is set."""
        # Instantiate a yolov5 object.
        yolonet = yolov5(modelpath='weights/yolov5x.onnx', confThreshold=0.3, nmsThreshold=0.5, objThreshold=0.3)
        frame_duration = 1. / self.framerate
        while not self.stop_capture:
            start = time.time()
            ret, frame = self.cap.read()
            if ret:
                # Pass the BGR frame straight to detect(): yolov5.preprocess
                # does the BGR->RGB conversion itself, so converting here as
                # well would feed the model channel-swapped images.
                annotated = yolonet.detect(frame)
                # Pillow expects RGB, so convert only for encoding.
                rgb = cv2.cvtColor(annotated, cv2.COLOR_BGR2RGB)
                # Encode into memory first: Pillow may call write() several
                # times per image, and each write() to the output is
                # published as a complete frame.
                buffer = io.BytesIO()
                Image.fromarray(rgb).save(buffer, format='JPEG')
                self.output.write(buffer.getvalue())
            elapsed = time.time() - start
            logging.debug("Frame acquisition time: %.2f", elapsed)
            # Sleep off the rest of the frame period to cap the frame rate.
            if elapsed < frame_duration:
                time.sleep(frame_duration - elapsed)

try:
    # Module-level on purpose: StreamingHandler.do_GET reads this global.
    output = StreamingOutput()
    # The video width, height and fps can be changed here.
    with Camera(output, 640, 480, 25, url=0) as camera:
        # Address and port the HTTP server listens on.
        address = ('', 8000)
        server = StreamingServer(address, StreamingHandler)
        try:
            server.serve_forever()
        finally:
            # Close the listening socket even when interrupted with Ctrl+C.
            server.server_close()
except KeyboardInterrupt:
    pass

三、运行程序

运行 yolo_streamer.py 程序后，在浏览器中访问 http://ip:8000/stream.mjpg 。

四、查看效果

浏览器打开上面的网页即可在浏览器实时观看效果

五、实验环境

windows10+python3.8+opencv4.5.4+onnxruntime1.10.0

六、项目说明

此项目只是完成了基本的检测，没有引入多线程来实现同时检测几个摄像头并实时观看，我目前已实现同时拉取三路rtsp流后实现目标检测，并分别上传到不同的网页，这里不详细介绍了，感兴趣的朋友可以尝试二次开发。

七、项目地址

https://github.com/SuperChay/mjpg_streamer-yolov5

Original: https://blog.csdn.net/cy364328541/article/details/123599467
Author: SuperChay
Title: 基于yolov5的mjpg-streamer服务器搭建

原创文章受到原创版权保护。转载请注明出处：https://www.johngo689.com/704902/

转载文章受原作者版权保护。转载请注明原作者出处！

人工智能

【自取】最近整理的，有需要可以领取学习：

Linux核心资料大放送~

全栈面试题汇总（持续更新&可下载）

一个提高学习100%效率的工具！

【超详细】深度学习面试题目！

LeetCode Python刷题答案下载！

LeetCode Java版刷题答案下载！

LeetCode C++ 版本，抓紧保存！

LeetCode GO语言刷题答案下载！

YOLOV7训练专属于自己的目标检测模型（保姆级教程，含数据集预处理）

ubuntu20.04 cuda11.0 cudnn8.0.4 python3.8 torch1.12.0 torchvision0.11.0 （1）把yolov7克隆到本地 gi…

人工智能 2023年6月23日
00121
利用pytorch快速实现分类任务

关于如何快速定义自己的数据集，可以参考我的前一篇文章PyTorch中快速加载自定义数据（入门）_晨曦473的博客-CSDN博客刚开始学习PyTorch，找了很多自定义数据加载的方法…

人工智能 2023年7月1日
00130
动手学深度学习（九+）——softmax分类Fashion-MNIST数据集

文章目录 * – 一、Fashion-MNIST数据集 – + 1.1 认识数据集 + 1.2 小批量读取数据 – 二、softmax回归从零开…

人工智能 2023年6月17日
00151
数电学习（十、脉冲波形的产生和整形）（三）

抵扣说明： 1.余额是钱包充值的虚拟货币，按照1:1的比例进行支付金额的抵扣。2.余额无法直接购买下载，可以购买VIP、C币套餐、付费专栏及课程。 Original: https:…

人工智能 2023年6月28日
00109
在自己的数据集上重新训练BERT（附代码）

最近有需要在新的领域进一步训练BERT，因此参照了hugging face官方文档写了相应的代码。本文采用的是hugging face提供的checkpoint，并在相应的task…

人工智能 2023年6月16日
00136
膨胀卷积（Dilated convolutions）（又叫空洞卷积、扩张卷积）

一、背景论文： Multi-Scale Context Aggregation by Dilated Convolutions 大部分图像分割的框架都是经历一系列的卷积和下采样的…

人工智能 2023年6月16日
00103
人工智能十大流行算法

人工智能是什么？很多人都知道，但大多又都说不清楚。事实上，人工智能已经存在于我们生活中很久了。比如我们常常用到的邮箱，其中垃圾邮件过滤就是依靠人工智能；比如每个智能手机都配备…

人工智能 2023年7月25日
0087
python实现朴素贝叶斯算法

本次实验的任务是文本分类，所用数据集为20news_bydate实验流程主要如下：一、算法介绍· 朴素贝叶斯算法是应用最为广泛的分类算法之一。· 给定训练数据集X，其类别为Y，则有…

人工智能 2023年6月15日
0097
人工智能不仅应当提高物质福利，而且应当满足人类的精神需求

然而，遵循阿西莫夫三定律而建造的人工智能或者机器人是奴隶般的，它们在社会上运行可以帮助人类整体，但它们奴隶般的地位是我们人类希望的吗？这是技术社会的理想形态吗？弗洛里迪说：&#82…

人工智能 2023年5月31日
00125
Ubuntu18.04安装ROS-melodic（使用国内镜像源，很快就能玩小乌龟了）

版本选择每个Ubuntu版本都对应不同的ROS版本，我使用的是 Ubuntu18.04，对应的版本是 ROS-melodic 建议先给Ubuntu也把源换了，不管下载什么都要方便…

人工智能 2023年6月2日
0093
医疗图像切割日记 01 – 用nnUNet做Fatal Head Segmentation Challenge

目录 1. nnUNet 介绍 1.1 nnUNet 特点 2. 准备工作 2.1 整理数据格式 – 用自己的数据集 2.2 设置路径 2.3 nnUNet预处理数据 …

人工智能 2023年6月20日
00126
深度学习相关阅读论文汇总（持续更新）

注意：按我文件夹的顺序更新的 77 A Ranking-Based Cross-Entropy Loss for Early Classification of Time Seri…

人工智能 2023年7月13日
0091
L1和L2正则化

1 过拟合问题过拟合是数据科学领域的一个重要问题，需要处理好过拟合问题才能建立一个健壮和准确的模型。当模型试图很好的拟合训练数据但导致无法泛化到测试数据时，就出现了过拟合。过拟合…

人工智能 2023年7月16日
0081
Unity -Demo 之 ✨ 接入“科大讯飞”语音识别SDK（完整）

抵扣说明： 1.余额是钱包充值的虚拟货币，按照1:1的比例进行支付金额的抵扣。2.余额无法直接购买下载，可以购买VIP、C币套餐、付费专栏及课程。 Original: https:…

人工智能 2023年5月25日
00118
从零实现深度学习框架——动手实现Softmax回归

; 引言本着”凡我不能创造的，我就不能理解”的思想，本系列文章会基于纯Python以及NumPy从零创建自己的深度学习框架，该框架类似PyTorch能实现…

人工智能 2023年6月17日
00118
小徐科研日记——深度学习视频分类方法

一、主要方法视频分类指将一段视频分类到预先制定类别集合中的某一个或多个。视频由空间维度和时间维度组成。包括静态图像特征，运动特征，音频特征，外部特征等。目前主要的方法有：双流网络…

人工智能 2023年7月27日
00128

2024 年 5 月
一	二	三	四	五	六	日
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31