yolov5支持动态batch_size、插入nms节点

最新推荐文章于 2025-01-08 19:07:39 发布

jstzwjr

最新推荐文章于 2025-01-08 19:07:39 发布

阅读量638

点赞数 1

CC 4.0 BY-SA版权

文章标签： YOLO

本文链接：https://blog.csdn.net/qq_17127427/article/details/132717133

文章讲述了如何使用 Python 库 `onnx` 和 `onnx_graphsurgeon`（导入为 `gs`），在 YOLOv5 的 QAT ONNX 模型（qat.onnx）中实现动态 batch size 并插入 NMS 节点，以增强模型的灵活性和性能。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

import onnx
import onnx_graphsurgeon as gs
import numpy as np

# Step 1: embed the class names as model metadata and make the batch
# dimension of the first graph input symbolic (dynamic batch size).
labels = ['mouse']
# Map class id -> label, e.g. {0: 'mouse'}.
names = dict(enumerate(labels))

model = onnx.load("/wjr/develop/projects/yolov5/qat.onnx")

# Store the id -> label mapping as a stringified dict under the "names" key.
meta = model.metadata_props.add()
meta.key = "names"
meta.value = str(names)

# Setting dim_param on axis 0 of the first input gives that axis a symbolic
# name instead of a fixed size.
graph = model.graph
batch_axis = graph.input[0].type.tensor_type.shape.dim[0]
batch_axis.dim_param = 'None'

onnx.save(model, '/wjr/develop/projects/yolov5/qat2.onnx')


# Step 2: append a TensorRT batched-NMS plugin node after the model output.
#
# Pipeline added to the graph:
#   prediction (b, n, 4 + n_cls)
#     -> Split   -> boxes (b, n, 4), scores (b, n, n_cls)
#     -> Reshape -> boxes (b, n, 1, 4)
#     -> BatchedNMSDynamic_TRT -> num_detections, nmsed_boxes,
#                                 nmsed_scores, nmsed_classes
n_cls = 1
# Symbolic batch dimension used for every tensor declared below. It reuses
# the dim_param name already assigned to the input's batch axis of qat2.onnx,
# so the new tensors are declared with a dynamic batch instead of a fixed 1.
batch_dim = "None"
# Number of candidate boxes per image; only used for declared tensor shapes.
num_boxes = 25500

# 1. Load the model.
graph = gs.import_onnx(onnx.load("/wjr/develop/projects/yolov5/qat2.onnx"))


# Split the b*n*(4+n_cls) output into a b*n*4 box part and a b*n*n_cls
# score part.
# NOTE(review): assumes the last axis of the model output is exactly
# 4 + n_cls wide (Split sizes must sum to the axis length) — confirm against
# the exported head.
split = gs.Constant("split", values=np.array([4, n_cls], dtype=np.int64))
output_box_0 = gs.Variable(
    name="output_box_0", shape=(batch_dim, num_boxes, 4), dtype=np.float32)
output_scores = gs.Variable(
    name="output_scores", shape=(batch_dim, num_boxes, n_cls),
    dtype=np.float32)
split_node = gs.Node(
    op="Split",
    inputs=[graph.outputs[0], split],
    outputs=[output_box_0, output_scores],
    attrs={"axis": 2},
)

# Reshape the boxes to add the per-class axis expected by the NMS plugin.
# In ONNX Reshape a 0 copies the corresponding input dimension and -1 is
# inferred, so the batch size is no longer hard-coded to 1 (a fixed
# [1, 25500, 1, 4] target would fail for any other batch size).
box_shape = gs.Constant(
    "shape", values=np.array([0, -1, 1, 4], dtype=np.int64))
output_boxes = gs.Variable(
    name="output_boxes", shape=(batch_dim, num_boxes, 1, 4),
    dtype=np.float32)
reshape_node = gs.Node(
    op="Reshape", inputs=[output_box_0, box_shape], outputs=[output_boxes])

# Outputs of the batched NMS node.
# keepTopK is a plugin attribute: the number of detections kept per image.
keepTopK = 100
topK = 1000
# num_detections: number of valid detections for each image.
num_detections = gs.Variable(
    name="num_detections", dtype=np.int32, shape=[batch_dim, 1])
# nmsed_boxes: box coordinates of the kept detections.
nmsed_boxes = gs.Variable(
    name="nmsed_boxes", dtype=np.float32, shape=[batch_dim, keepTopK, 4])
# nmsed_scores: score of each kept detection.
nmsed_scores = gs.Variable(
    name="nmsed_scores", dtype=np.float32, shape=[batch_dim, keepTopK])
# nmsed_classes: class id of each kept detection (declared as float32).
nmsed_classes = gs.Variable(
    name="nmsed_classes", dtype=np.float32, shape=[batch_dim, keepTopK])

new_outputs = [num_detections, nmsed_boxes, nmsed_scores, nmsed_classes]

# Attributes of the NMS plugin node. "plugin_version" and "caffeSemantics"
# are intentionally not set here.
attrs = {
    # Whether boxes are shared across classes during NMS.
    "shareLocation": False,
    # Background class id; -1 when there is no background class.
    "backgroundLabelId": -1,
    "numClasses": n_cls,
    # Number of boxes fed into NMS.
    "topK": topK,
    # Number of boxes kept per image after NMS.
    "keepTopK": keepTopK,
    "scoreThreshold": 0.50,
    "iouThreshold": 0.7,
    # Whether the input box coordinates are normalized.
    "isNormalized": False,
    # Clip boxes; only takes effect when isNormalized is True.
    "clipBoxes": False,
    "scoreBits": 16,
}

nms_node = gs.Node(
    # BatchedNMS_TRT cannot be used: it does not support dynamic batch size.
    op="BatchedNMSDynamic_TRT",
    attrs=attrs,
    inputs=[output_boxes, output_scores],
    outputs=new_outputs,
)

# Register the new nodes and make the NMS results the graph outputs.
graph.nodes.extend([split_node, reshape_node, nms_node])
graph.outputs = new_outputs

# Remove dangling nodes/tensors and restore topological order before export.
graph.cleanup().toposort()
onnx.save(gs.export_onnx(graph), "/wjr/develop/projects/yolov5/qat3.onnx")