Yolox目标检测训练实录–1. 数据准备

2023年7月10日上午9:49 • 人工智能 • 阅读 63


git clone git@github.com:Megvii-BaseDetection/YOLOX.git
cd YOLOX
pip3 install -v -e .

conda create -n yolox python=3.7
conda activate yolox

#如果你切换了国内的源可以把后面的-c pytorch去掉。
conda install pytorch=1.7 torchvision cudatoolkit=10.2 -c pytorch

git clone git@github.com:Megvii-BaseDetection/YOLOX.git
cd YOLOX
pip install -r requirements.txt
python setup.py develop

python tools/demo.py image -f exps/default/yolox_s.py -c yolox_s.pth --path assets/dog.jpg --conf 0.25 --nms 0.45 --tsize 640 --save_result --device gpu

使用Python把原始数据中的car类别挑选出来

import xml.etree.ElementTree as ET
import os

def newImageSets(oldSets, newSets, annDir="Annotations"):
    """Write the ids of an image-set list whose annotation file exists.

    Every non-blank line of ``oldSets`` is read as an integer image id. The
    id is kept when ``<annDir>/<id zero-padded to 6 digits>.xml`` exists, and
    the kept ids are appended to ``newSets`` one per line.

    Args:
        oldSets: Path of the source image-set text file (one id per line).
        newSets: Path of the list to write. It is opened in append mode, so
            an existing file is extended rather than replaced.
        annDir: Folder holding the ``%06d.xml`` annotation files. Defaults to
            the previously hard-coded ``"Annotations"``.

    Raises:
        ValueError: If a non-blank line is not an integer id.
    """
    kept = []

    with open(oldSets, 'r') as src:
        for line in src:
            entry = line.strip()
            if not entry:
                # Blank / trailing empty lines used to abort the run in int().
                continue

            annPath = os.path.join(annDir, '%06d.xml' % int(entry))
            if os.path.exists(annPath):
                print(annPath)
                # Always terminate the id ourselves so a final line without a
                # newline cannot fuse with the next appended id.
                kept.append(entry + "\n")

    with open(newSets, 'a') as dst:
        dst.writelines(kept)

def selectCarAnn(srcAnnPath, dstAnnPath, className='car', idRange=range(1, 9964)):
    """Copy the annotations that contain ``className``, reduced to that class.

    For every id in ``idRange`` the file ``<srcAnnPath>/<id as 6 digits>.xml``
    is parsed. When at least one top-level ``<object>`` has a ``<name>`` equal
    to ``className``, all other top-level objects are removed and the result
    is written under the same file name in ``dstAnnPath``. The number of
    written files is printed.

    Args:
        srcAnnPath: Folder with the source XML annotations.
        dstAnnPath: Folder receiving the filtered annotations; created when
            it does not exist yet.
        className: Object name to keep. Defaults to ``'car'``.
        idRange: Iterable of integer image ids to visit. Defaults to the
            previously hard-coded ``range(1, 9964)``.
    """
    if dstAnnPath:
        os.makedirs(dstAnnPath, exist_ok=True)

    count = 0

    for imageId in idRange:
        # Format the file name before joining so a '%' inside a folder name
        # cannot be mistaken for a format directive.
        fileName = "%06d.xml" % imageId
        srcFile = os.path.join(srcAnnPath, fileName)
        if not os.path.isfile(srcFile):
            # Not every id in the range has to exist; skip the gaps instead of
            # aborting on the first missing file.
            continue

        rootTree = ET.parse(srcFile)
        target = rootTree.getroot()

        hasWanted = False
        unwanted = []
        # Only direct children can be handed to target.remove() below.
        for obj in target.findall("object"):
            if obj.find("name").text.strip() == className:
                hasWanted = True
            else:
                unwanted.append(obj)

        if not hasWanted:
            continue

        for obj in unwanted:
            target.remove(obj)

        rootTree.write(os.path.join(dstAnnPath, fileName))
        count += 1

    print(count)

def main():
    """Filter the annotations with selectCarAnn, then rebuild the test list."""
    annotationDirs = ("Annotations", "Annotations_new")
    imageSetFiles = ("ImageSets/Main/test.txt", "ImageSets/Main/test_new.txt")

    selectCarAnn(*annotationDirs)

    # NOTE(review): newImageSets checks ids against the 'Annotations' folder,
    # not the freshly written 'Annotations_new' -- confirm this is intended.
    newImageSets(*imageSetFiles)


if __name__ == '__main__':
    main()

import scipy.io as scio
import cv2
import random
import colorsys
import os

def loadbox(data):
    """Collect the first four corner entries of every box record.

    Args:
        data: Mapping with a ``'boxes'`` entry. ``data['boxes'][0]`` is
            iterated and every item is read as ``box[0][0][k][0]`` for
            ``k`` in 0..3.

    Returns:
        A list with one 4-element list per box, in input order.
    """
    return [
        [box[0][0][corner][0] for corner in range(4)]
        for box in data['boxes'][0]
    ]
def get_n_hls_colors(num):
    """Return exactly ``num`` HLS colors with evenly spaced hues.

    Hues are ``k / num`` for ``k`` in ``0..num-1``. Lightness is drawn at
    random from 0.50-0.60 and saturation from 0.90-1.00, so repeated calls
    give different shades.

    Args:
        num: Number of colors wanted (an integer).

    Returns:
        A list of ``[h, l, s]`` lists with every component in the 0..1 range;
        an empty list when ``num`` is smaller than 1.
    """
    if num < 1:
        # Previously 0 divided by zero and a negative value looped forever.
        return []

    step = 360.0 / num
    hls_colors = []
    # Count the colors instead of accumulating a float hue: repeated addition
    # of ``step`` can stop just short of 360 and emit one color too many.
    for k in range(num):
        hue = k * step
        saturation = 90 + random.random() * 10
        lightness = 50 + random.random() * 10
        hls_colors.append([hue / 360.0, lightness / 100.0, saturation / 100.0])

    return hls_colors
def ncolors(num):
    """Return RGB colors converted from the output of get_n_hls_colors(num).

    Args:
        num: Number of colors requested.

    Returns:
        A list of ``[r, g, b]`` integer lists, each channel being the
        converted component multiplied by 255 and truncated with ``int``;
        an empty list when ``num`` is smaller than 1.
    """
    if num < 1:
        return []

    palette = []
    for hue, lightness, saturation in get_n_hls_colors(num):
        channels = colorsys.hls_to_rgb(hue, lightness, saturation)
        palette.append([int(channel * 255.0) for channel in channels])

    return palette

def drawImg(boxes, img):
    """Draw the axis-aligned extent of every box onto ``img`` in place.

    Args:
        boxes: Sequence of boxes; each box holds four corner points where
            index 1 of a point is used as x and index 0 as y.
        img: Image array passed to ``cv2.rectangle``; its shape is printed.

    Returns:
        Always 0.
    """
    print(img.shape)
    total = len(boxes)
    palette = ncolors(total)

    # Colors are handed out from the end of the palette towards its start.
    for colorIdx, corners in zip(range(total - 1, -1, -1), boxes):
        rgb = palette[colorIdx]
        color = (rgb[2], rgb[1], rgb[0])  # reversed channel order for cv2

        xs = [int(corners[k][1]) for k in range(4)]
        ys = [int(corners[k][0]) for k in range(4)]

        cv2.rectangle(img, (min(xs), min(ys)), (max(xs), max(ys)), color, 1)

    return 0

def process_single_pair(imgPath, matPath):
    """Show one image with the boxes of its .mat annotation drawn on it.

    Args:
        imgPath: Path of the image, read with ``cv2.imread``.
        matPath: Path of the annotation, read with ``scipy.io.loadmat``.

    Returns:
        Always 0.
    """
    image = cv2.imread(imgPath)
    annotation = scio.loadmat(matPath)

    boxes = loadbox(annotation)
    drawImg(boxes, image)  # rectangles are drawn onto ``image`` itself

    cv2.imshow("tt", image)

    return 0

def vis_folder(imgFolder, matFolder):
    """Step through the .jpg files of a folder, showing each with its boxes.

    For every ``.jpg`` entry the path is printed; when a ``.mat`` file with
    the same stem exists in ``matFolder`` the pair is displayed and the
    function waits for a key press. Pressing ``q`` closes the windows and
    stops the loop.

    Args:
        imgFolder: Folder containing the images.
        matFolder: Folder containing the matching ``.mat`` annotations.

    Returns:
        Always 0.
    """
    for fileName in os.listdir(imgFolder):
        if not fileName.endswith(".jpg"):
            continue

        imgPath = os.path.join(imgFolder, fileName)
        print(imgPath)
        matPath = os.path.join(matFolder, fileName[:-3] + "mat")
        if not (os.path.exists(imgPath) and os.path.exists(matPath)):
            continue

        process_single_pair(imgPath, matPath)
        if cv2.waitKey(0) == ord('q'):
            cv2.destroyAllWindows()
            break

    return 0


if __name__ == '__main__':
    vis_folder("test_dataset/test_data/images/","test_dataset/test_data/annotations/")

将 hand dataset 转换为 VOC 格式的代码

import copy
import scipy.io as scio
import cv2
import os
import xml.etree.ElementTree as ET

class HandData2VOC():
    """Convert hand-dataset ``.mat`` annotations into VOC-style XML files.

    An existing VOC annotation (``xmlAnnotation``) serves as the XML template:
    its folder, filename, size and first ``<object>`` are overwritten for each
    converted image, and one extra ``<object>`` is appended per further box.
    """

    def __init__(self):
        # Folder with the source .mat annotation files.
        self.srcHandAnnotationsDir = "hand_dataset/annotations/"
        # Folder receiving the generated XML annotations.
        self.dstHandAnnotationsDir = "voc_style/Annotations/"
        # Folder with the images; read to obtain width, height and depth.
        self.imageDir = 'voc_style/JPEGImages/'
        # Folder receiving the image-set list written by run().
        self.imageSets = 'voc_style/ImageSets/'

        # XML file used as the template for every output annotation.
        self.xmlAnnotation = "000004.xml"

    def test(self):
        """Placeholder; does nothing."""
        return

    @staticmethod
    def _boxBounds(box):
        """Return ``(xmin, ymin, xmax, ymax)`` of one box record's 4 corners."""
        corners = [box[0][0][k][0] for k in range(4)]
        # Index 1 of a corner is used as x and index 0 as y.
        xs = [int(pt[1]) for pt in corners]
        ys = [int(pt[0]) for pt in corners]
        return min(xs), min(ys), max(xs), max(ys)

    @staticmethod
    def _fillBndBox(objNode, bounds):
        """Write ``(xmin, ymin, xmax, ymax)`` into the object's ``<bndbox>``."""
        nodeBndBox = objNode.find("bndbox")
        for tag, value in zip(("xmin", "ymin", "xmax", "ymax"), bounds):
            nodeBndBox.find(tag).text = str(value)

    def runTransfor(self, matName):
        """Convert one ``.mat`` annotation into a VOC XML file.

        Args:
            matName: File name (not path) of the annotation inside
                ``srcHandAnnotationsDir``; the image and the output XML share
                its stem.

        Returns:
            1 when an XML file was written; 0 when the image cannot be read
            or the annotation contains no boxes (nothing is written then).

        Raises:
            ValueError: If the template XML has no ``<object>`` element.
        """
        stem = os.path.splitext(matName)[0]
        imageName = stem + ".jpg"
        savePath = os.path.join(self.dstHandAnnotationsDir, stem + ".xml")

        imgPath = os.path.join(self.imageDir, imageName)
        img = cv2.imread(imgPath)
        if img is None:
            # Without this check the shape access below raised AttributeError
            # and aborted the whole batch.
            print('----------------------->: cannot read image ', imgPath)
            return 0
        h, w = img.shape[:2]
        c = img.shape[2] if len(img.shape) > 2 else 1

        matPath = os.path.join(self.srcHandAnnotationsDir, matName)
        data = scio.loadmat(matPath)

        boxes_data = data['boxes'][0]
        numBox = len(boxes_data)
        print("==============4. numBox: ", numBox)
        if numBox == 0:
            print('----------------------->: ', matName)
            return 0

        rootTree = ET.parse(self.xmlAnnotation)
        target = rootTree.getroot()

        target.find('folder').text = "Hand_data"
        target.find("filename").text = imageName

        nodeSize = target.find('size')
        nodeSize.find('width').text = str(w)
        nodeSize.find("height").text = str(h)
        nodeSize.find("depth").text = str(c)

        objNodes = target.findall("object")
        if not objNodes:
            raise ValueError(
                "template %s has no <object> element" % self.xmlAnnotation)
        objTemplate = objNodes[0]
        # Objects beyond the first describe the template image, not this one;
        # drop them so they do not leak into the output.
        for stale in objNodes[1:]:
            target.remove(stale)
        objTemplate.find("name").text = "hand"

        for index, box in enumerate(boxes_data):
            bounds = self._boxBounds(box)
            if index == 0:
                # The first box reuses the template's own <object> node.
                objNode = objTemplate
            else:
                objNode = copy.deepcopy(objTemplate)
                target.append(objNode)
            self._fillBndBox(objNode, bounds)
            print(bounds[0], " ", bounds[1], " ", bounds[2], " ", bounds[3])

        if self.dstHandAnnotationsDir:
            os.makedirs(self.dstHandAnnotationsDir, exist_ok=True)
        rootTree.write(savePath)
        print("===========save: ", savePath)

        return 1

    def run(self):
        """Convert every ``.mat`` annotation and write the image-set list.

        The stems of the successfully converted files are written, one per
        line, to ``test0.txt`` inside ``imageSets``. Entries that do not end
        in ``.mat`` are ignored, and files are visited in sorted order so the
        list is reproducible.

        Returns:
            Always 0.
        """
        annotations = sorted(os.listdir(self.srcHandAnnotationsDir))

        if self.imageSets:
            os.makedirs(self.imageSets, exist_ok=True)
        setDir = os.path.join(self.imageSets, "test0.txt")
        with open(setDir, 'w') as file:

            for mat in annotations:
                if not mat.lower().endswith(".mat"):
                    # Stray files (notes, thumbnails, ...) are not annotations.
                    continue

                if self.runTransfor(mat):
                    file.write(os.path.splitext(mat)[0] + "\n")

        return 0

完整数据和代码提取码：1fut

数据处理结束，检查一下处理的效果如何：

import numpy as np
def parserXml(xmlPath, keep_difficult=True):
    """Read the bounding boxes of a VOC-style XML annotation.

    Args:
        xmlPath: Path of the XML annotation file.
        keep_difficult: When False, objects whose ``<difficult>`` value is 1
            are skipped. The default keeps every object, which is what the
            former always-false ``if not 1 and difficult`` test amounted to.

    Returns:
        A float array of shape ``(N, 5)`` with one row per object:
        ``xmin, ymin, xmax, ymax`` (each reduced by 1) followed by the label
        index, which is always 1. ``N`` is 0 when there are no objects.
    """
    target = ET.parse(xmlPath).getroot()

    label_idx = 1  # single-class data: every box gets the same label
    rows = []
    for obj in target.iter("object"):
        difficultNode = obj.find("difficult")
        difficult = difficultNode is not None and int(difficultNode.text) == 1
        if difficult and not keep_difficult:
            continue

        bbox = obj.find("bndbox")
        # Coordinates may be written as floats ("21.0"); truncate, then shift
        # by one as the original code did.
        row = [int(float(bbox.find(pt).text)) - 1
               for pt in ("xmin", "ymin", "xmax", "ymax")]
        row.append(label_idx)
        rows.append(row)

    # Build the array once; reshape keeps the (0, 5) shape for empty files.
    res = np.array(rows, dtype=float).reshape(-1, 5)

    size = target.find("size")
    if size is not None:
        width = int(size.find("width").text)
        height = int(size.find("height").text)
        img_info = (height, width)
        print(img_info)

    return res

def showVocStyleData(imgDir, annDir):
    """Display every annotated image with its boxes drawn in green.

    For each ``.xml`` file in ``annDir`` the ``.jpg`` with the same stem is
    read from ``imgDir``, the boxes returned by ``parserXml`` are drawn, and
    the image is shown until a key is pressed. Pressing Esc (key code 27)
    closes the windows and stops. Entries that are not ``.xml`` files and
    images that cannot be read are skipped.

    Args:
        imgDir: Folder containing the images.
        annDir: Folder containing the XML annotations.
    """
    for ann in sorted(os.listdir(annDir)):
        stem, ext = os.path.splitext(ann)
        if ext.lower() != ".xml":
            continue

        annPath = os.path.join(annDir, ann)
        imgPath = os.path.join(imgDir, stem + ".jpg")

        img = cv2.imread(imgPath)
        if img is None:
            # Without this check the shape access below raised AttributeError
            # and ended the viewer.
            print("skip, cannot read image: ", imgPath)
            continue
        print(img.shape)

        res = parserXml(annPath)

        for resi in res:
            print(resi)
            x0, y0, x1, y1 = (int(v) for v in resi[:4])
            cv2.rectangle(img, (x0, y0), (x1, y1), (0, 200, 0), 2)

        cv2.imshow('test', img)

        if cv2.waitKey(0) & 0xff == 27:
            cv2.destroyAllWindows()
            break

    return

Original: https://blog.csdn.net/weixin_45331269/article/details/123608147
Author: young_s%
Title: Yolox目标检测训练实录–1. 数据准备

原创文章受到原创版权保护。转载请注明出处：https://www.johngo689.com/682549/

转载文章受原作者版权保护。转载请注明原作者出处！

人工智能

【自取】最近整理的，有需要可以领取学习：

Linux核心资料大放送~

全栈面试题汇总（持续更新&可下载）

一个提高学习100%效率的工具！

【超详细】深度学习面试题目！

LeetCode Python刷题答案下载！

LeetCode Java版刷题答案下载！

LeetCode C++ 版本，抓紧保存！

LeetCode GO语言刷题答案下载！

python复制dataframe_Python Pandas复制和修改datafram中的一些行

我觉得在 pandas 中没有什么特别好的方法。每当一个DataFrame包含一列列表，并且您想进行某种需要在列表上迭代的计算，您就必须为列中的每个项(即list)调用一次Python函数…

人工智能 2023年7月7日
0058
[pytorch] RCNN物体检测的简化实现（d2l-香蕉数据集）

论文地址RCNN物体检测的主要步骤如下：训练：监督预训练：利用ILSVRC 2012进行预训练，lr=0.01 在VOC 2012 train上微调：将CNN最后的1000分类初…

人工智能 2023年7月22日
0098
HRSC2016 数据集 L2 L3 task

网上没有HRSC2016 数据集 L2 L3 task 任务的开源项目，我的毕设跟老师吹的牛是把数据集用到L2、L3任务上，现在发现没有开源代码，心态没了。接下来这段时间尝试手写代…

人工智能 2023年6月17日
0069
DJLJava环境下部署pytorch模型推理

由于大数据基本都是Java环境，希望与深度学习结合的话，需要将深度学习模型部署在Java环境下。传统方式使用flask搭建接口，在Java环境中对其调用，但通信时间和内存问题限制了…

人工智能 2023年7月24日
0057
机器学习库Scikit-Learn（线性模型、岭回归、插入一列数据（insert）、提取所需列、向量机（SVM）、聚类）

本文来自《Python数据分析从入门到精通》-明日科技编著机器学习顾名思义就是让机器（计算机）模拟人类学习，有效提高工作效率。Python提供的第三方库Scikit-Learn融…

人工智能 2023年6月2日
0071
2022年好用的无线蓝牙耳机，性价比最高的学生党蓝牙耳机推荐

如今的蓝牙耳机已经是我们生活中必不可少的物品，它再也不是简单的听音乐工具了，现在的蓝牙耳机不仅可以听音乐，接听电话，还能唤醒语音助手等功能。但是，目前蓝牙耳机的同质化现象非常严重，…

人工智能 2023年5月25日
00102
引力搜索算法极限学习机GSA-ELM回归预测及其MATLAB代码实现

引力搜索算法（Gravitational Search Algorithm， GSA）是一种基于引力模拟的优化算法，它模拟天体之间的引力作用，并通过引力和质量…

人工智能 2023年6月29日
0080
使用C语言实现矩阵转置（稀疏矩阵）

目录 1.转置矩阵（普通矩阵） 2.转置矩阵（稀疏矩阵）（1）稀疏矩阵（2）稀疏矩阵的压缩存储方式（3）理论运算方法 1.转置矩阵（普通矩阵）矩阵的转置：根据主对角元素作为…

人工智能 2023年7月4日
0052
支持哪些硬件加速

问题背景在计算机领域，硬件加速是指使用专门的硬件设备来加速计算任务的执行速度。硬件加速可以在很多领域得到应用，如图形处理、机器学习、密码学等。本文将以图形处理为例，介绍支持硬件加…

人工智能 2023年12月31日
0032
ResNeXt网络解析

ResNeXt是ResNet和Inception的结合体.ResNeXt借鉴Inception的”分割-变换-聚合”策略（即split-transform-…

人工智能 2023年7月13日
0077
一个既能做CV任务，也能做NLP任务的Transformer模型！谷歌&UCLA提出统一的基础模型…

关注公众号，发现CV技术之美。本文分享论文『Towards a Unified Foundation Model: Jointly Pre-Training Transformer…

人工智能 2023年5月31日
0072
【Python刷题篇】——Python入门 07 循环语句（上）

抵扣说明： 1.余额是钱包充值的虚拟货币，按照1:1的比例进行支付金额的抵扣。2.余额无法直接购买下载，可以购买VIP、C币套餐、付费专栏及课程。 Original: https:…

人工智能 2023年6月3日
0059
最新目标检测算法回顾2022笔记

目标检测算法回顾2022笔记[附PPT] 总目录篇章1：目标检测的应用与需求篇章2：目标检测的定义与挑战篇章3：目标检测损失函数的进展篇章4：目标检测IOU的发展历程篇章…

人工智能 2023年6月22日
0068
将DataFrame转化为Excel

学习pandas第三天，将会每天坚持打卡学习就学习，如果觉得有帮助可以点赞一哈！！！ # 1.将DataFrame保存为Excel 1）下面是DataFrame文件 2）通过下面这…

人工智能 2023年7月6日
0069
ImageNet数据集简介与下载详细步骤

ImageNet与ILSVRC简介 ImageNet是一种数据集，而不是神经网络模型。它是斯坦福大学教授李飞飞为了解决机器学习中过拟合和泛化的问题而牵头构建的数据集。该数据集从2007年…

人工智能 2023年6月15日
00510
resnet18实现猫狗图片的分类

简介使用猫狗分类数据集中的训练集，共25000张图片。将原始训练集进行拆分，其中20000张用于训练，其余5000张用于测试。分类网络使用ResNet-18，使用了交叉熵损失函数…

人工智能 2023年7月2日
0076

2024 年 4 月
一	二	三	四	五	六	日
1	2	3	4	5	6	7
8	9	10	11	12	13	14
15	16	17	18	19	20	21
22	23	24	25	26	27	28
29	30

Yolox目标检测训练实录–1. 数据准备

大家都在看