TVM yolov3优化代码修改(编译运行OK)

yolov3_quantize_sample.py

附https://github.com/makihiro/tvm_yolov3_sample代码:
yolov3_quantize_sample.py
import nnvm
import nnvm.frontend.darknet
import nnvm.testing.yolo_detection
import nnvm.testing.darknet
import matplotlib.pyplot as plt
import numpy as np
import tvm
from tvm import rpc
import sys
import cv2
import time

from ctypes import *
from tvm.contrib import util
from tvm.contrib.download import download
from nnvm.testing.darknet import __darknetffi__

# Model name
MODEL_NAME = 'yolov3'

######################################################################
# Download required files
# -----------------------
# Download cfg and weights file if first time.

CFG_NAME = MODEL_NAME + '.cfg'
WEIGHTS_NAME = MODEL_NAME + '.weights'
REPO_URL = 'https://github.com/siju-samuel/darknet/blob/master/'
CFG_URL = REPO_URL + 'cfg/' + CFG_NAME + '?raw=true'
WEIGHTS_URL = 'https://pjreddie.com/media/files/' + WEIGHTS_NAME

download(CFG_URL, CFG_NAME)
download(WEIGHTS_URL, WEIGHTS_NAME)

# Download and load the platform-specific prebuilt darknet shared library.
if sys.platform in ['linux', 'linux2']:
    DARKNET_LIB = 'libdarknet2.0.so'
    DARKNET_URL = REPO_URL + 'lib/' + DARKNET_LIB + '?raw=true'
elif sys.platform == 'darwin':
    DARKNET_LIB = 'libdarknet_mac2.0.so'
    DARKNET_URL = REPO_URL + 'lib_osx/' + DARKNET_LIB + '?raw=true'
else:
    err = "Darknet lib is not supported on {} platform".format(sys.platform)
    raise NotImplementedError(err)

download(DARKNET_URL, DARKNET_LIB)

# dlopen the darknet library through cffi and load the network
# (cfg + weights) into a native darknet `network` handle.
DARKNET_LIB = __darknetffi__.dlopen('./' + DARKNET_LIB)
cfg = "./" + str(CFG_NAME)
weights = "./" + str(WEIGHTS_NAME)
net = DARKNET_LIB.load_network(cfg.encode('utf-8'), weights.encode('utf-8'), 0)
dtype = 'float32'
batch_size = 1

# Import the darknet graph into NNVM symbols + params.
print("Converting darknet to nnvm symbols...")
sym, params = nnvm.frontend.darknet.from_darknet(net, dtype)

######################################################################
# Compile the model
# -----------------
# Choose target: local LLVM/CPU or remote CUDA/GPU.
local = True

if local:
    target = 'llvm'
    ctx = tvm.cpu(0)
else:
    target = 'cuda'
    ctx = tvm.gpu(0)

# Input placeholder matching the network's (batch, channels, height, width).
data = np.empty([batch_size, net.c, net.h, net.w], dtype)
shape = {'data': data.shape}

dtype_dict = {}

# Convert the NNVM graph into a Relay function.
print("convert nnvm symbols into relay function...")
from nnvm.to_relay import to_relay
func, params = to_relay(sym, shape, 'float32', params=params)

# Run Relay-level graph optimizations before quantization.
print("optimize relay graph...")
with tvm.relay.build_config(opt_level=2):
    func = tvm.relay.optimize(func, target, params)

# Quantize the optimized function with the default quantization config.
print("apply quantization...")
from tvm.relay import quantize
with quantize.qconfig():
    func = quantize.quantize(func, params)

# Build the quantized Relay function into graph JSON, a compiled
# library, and the (possibly folded) params.
print("Compiling the model...")
print(func.astext(show_meta_data=False))
with tvm.relay.build_config(opt_level=3):
    graph, lib, params = tvm.relay.build(func, target=target, params=params)

# Save the compiled library so it can be uploaded to the runtime device.
tmp = util.tempdir()
lib_fname = tmp.relpath('model.tar')
lib.export_library(lib_fname)

# NOTE(review): the original script additionally ran nnvm.compiler.build
# here, which overwrote the quantized Relay `graph` and `params` while the
# exported `model.tar` above remained the Relay library -- a graph/lib
# mismatch at runtime. The redundant NNVM rebuild is removed so the
# runtime module is created from matching artifacts.

# Network input spatial size taken from the data shape (H, W).
[neth, netw] = shape['data'][2:]  # Current image shape is 608x608
######################################################################
# Execute on TVM Runtime
# ----------------------
# The process is no different from other examples.

from tvm.contrib import graph_runtime

if local:
    remote = rpc.LocalSession()
    ctx = remote.cpu(0)
else:
    # The following is my environment, change this to the IP address of your target device
    host = 'localhost'
    port = 9090
    remote = rpc.connect(host, port)
    ctx = remote.gpu(0)

# Upload the library to the remote device and load it.
remote.upload(lib_fname)
rlib = remote.load_module('model.tar')

# Create the remote runtime module and bind the compiled params.
m = graph_runtime.create(graph, rlib, ctx)
m.set_input(**params)
thresh = 0.5        # detection confidence threshold
nms_thresh = 0.45   # non-maximum-suppression IoU threshold
coco_name = 'coco.names'
coco_url = 'https://github.com/siju-samuel/darknet/blob/master/data/' + coco_name + '?raw=true'
font_name = 'arial.ttf'
font_url = 'https://github.com/siju-samuel/darknet/blob/master/data/' + font_name + '?raw=true'
download(coco_url, coco_name)
download(font_url, font_name)

# One class name per line in coco.names.
with open(coco_name) as f:
    content = f.readlines()

names = [x.strip() for x in content]

# Test image demo
test_image = 'dog.jpg'
print("Loading the test image...")
img_url = 'https://github.com/siju-samuel/darknet/blob/master/data/' + \
          test_image + '?raw=true'
download(img_url, test_image)

# Load the image resized/letterboxed to the network input size.
data = nnvm.testing.darknet.load_image(test_image, netw, neth)
# Set inputs
m.set_input('data', tvm.nd.array(data.astype(dtype)))
# Execute
print("Running the test image...")

m.run()
# Collect the three YOLO output heads; each head produces 4 outputs
# laid out as (output, mask, biases, attributes).
tvm_out = []
for i in range(3):
    layer_out = {}
    layer_out['type'] = 'Yolo'
    # Get the yolo layer attributes (n, out_c, out_h, out_w, classes, total)
    layer_attr = m.get_output(i*4+3).asnumpy()
    layer_out['biases'] = m.get_output(i*4+2).asnumpy()
    layer_out['mask'] = m.get_output(i*4+1).asnumpy()
    out_shape = (layer_attr[0], layer_attr[1] // layer_attr[0],
                 layer_attr[2], layer_attr[3])
    layer_out['output'] = m.get_output(i*4).asnumpy().reshape(out_shape)
    layer_out['classes'] = layer_attr[4]
    tvm_out.append(layer_out)

# Decode boxes at the original image resolution, apply NMS, and draw.
img = nnvm.testing.darknet.load_image_color(test_image)
_, im_h, im_w = img.shape
dets = nnvm.testing.yolo_detection.fill_network_boxes((netw, neth), (im_w, im_h), thresh,
                                                      1, tvm_out)
last_layer = net.layers[net.n - 1]
nnvm.testing.yolo_detection.do_nms_sort(dets, last_layer.classes, nms_thresh)
nnvm.testing.yolo_detection.draw_detections(img, dets, thresh, names, last_layer.classes)

# img is CHW; matplotlib expects HWC.
plt.imshow(img.transpose(1, 2, 0))
plt.show()

# Video demo (webcam); disabled by default.
video_demo = False
if video_demo:

    #vcap = cv2.VideoCapture("video.mp4")
    vcap = cv2.VideoCapture(0)

    n_frames = 0
    seconds = 0.0
    fps = 0.0
    while True:
        # Start time
        start = time.time()
        # Capture frame-by-frame
        n_frames = n_frames + 1

        ret, frame = vcap.read()
        if not ret:
            # Camera closed or read failed -- stop cleanly instead of
            # crashing on a None frame below.
            break
        # HWC uint8 frame -> CHW float in [0, 1]; np.flip on axis 0
        # reverses the channel order (presumably BGR -> RGB for darknet
        # -- confirm against load_image's convention).
        img = np.array(frame)
        img = img.transpose((2, 0, 1))
        img = np.divide(img, 255.0)
        img = np.flip(img, 0)
        data = nnvm.testing.darknet._letterbox_image(img, netw, neth)
        # Set inputs
        m.set_input('data', tvm.nd.array(data.astype(dtype)))
        # Execute
        print("Running the test image...")

        m.run()
        # Collect the three YOLO heads, same layout as the still-image path:
        # (output, mask, biases, attributes) per head.
        tvm_out = []
        for i in range(3):
            layer_out = {}
            layer_out['type'] = 'Yolo'
            # Get the yolo layer attributes (n, out_c, out_h, out_w, classes, total)
            layer_attr = m.get_output(i*4+3).asnumpy()
            layer_out['biases'] = m.get_output(i*4+2).asnumpy()
            layer_out['mask'] = m.get_output(i*4+1).asnumpy()
            out_shape = (layer_attr[0], layer_attr[1] // layer_attr[0],
                         layer_attr[2], layer_attr[3])
            layer_out['output'] = m.get_output(i*4).asnumpy().reshape(out_shape)
            layer_out['classes'] = layer_attr[4]
            tvm_out.append(layer_out)

        # Decode, NMS, and draw on the captured frame.
        _, im_h, im_w = img.shape
        dets = nnvm.testing.yolo_detection.fill_network_boxes((netw, neth), (im_w, im_h), thresh,
                                                              1, tvm_out)
        last_layer = net.layers[net.n - 1]
        nnvm.testing.yolo_detection.do_nms_sort(dets, last_layer.classes, nms_thresh)
        nnvm.testing.yolo_detection.draw_detections(img, dets, thresh, names, last_layer.classes)
        # End time
        end = time.time()

        # Time elapsed
        seconds = (end - start)
        # Running average of current and previous FPS estimate.
        fps = (fps + (1 / seconds)) / 2
        print(fps)
        cv2.putText(img, str(fps), (10, 50), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 3)
        cv2.imshow('Video', img.transpose(1, 2, 0))
        # Press Q to stop!

        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
    # Release the capture device (was leaked in the original).
    vcap.release()
    cv2.destroyAllWindows()

参考链接:
https://github.com/makihiro/tvm_yolov3_sample

Original: https://blog.csdn.net/wujianing_110117/article/details/121449316
Author: wujianming_110117
Title: TVM yolov3优化代码修改(编译运行OK)

原创文章受到原创版权保护。转载请注明出处:https://www.johngo689.com/687814/

转载文章受原作者版权保护。转载请注明原作者出处!

(0)

大家都在看

亲爱的 Coder【最近整理,可免费获取】👉 最新必读书单  | 👏 面试题下载  | 🌎 免费的AI知识星球