参考文档
https://docs.djangoproject.com/zh-hans/5.0/intro/tutorial01/
待验证:将 ONNX 模型转换为 TensorRT 引擎
import tensorrt as trt
# Convert model.onnx into a serialized TensorRT engine saved as model.trt.

# Logger shared by every TensorRT object below; reports warnings and errors.
logger = trt.Logger(trt.Logger.WARNING)
# Runtime is not used by the build itself; it is kept so the saved engine
# can be deserialized afterwards in the same session.
runtime = trt.Runtime(logger)
# Builder plus an explicit-batch network definition for the parser to fill.
builder = trt.Builder(logger)
network = builder.create_network(
    1 << int(trt.NetworkDefinitionCreationFlag.EXPLICIT_BATCH)
)
# ONNX parser that populates `network`.
parser = trt.OnnxParser(network, logger)
# Load the ONNX model. parse() signals failure through its return value
# rather than an exception, so collect the parser's errors and stop here
# instead of building from a half-populated network.
with open("model.onnx", "rb") as model_file:
    if not parser.parse(model_file.read()):
        parse_errors = "\n".join(
            str(parser.get_error(i)) for i in range(parser.num_errors)
        )
        raise RuntimeError(f"Failed to parse model.onnx:\n{parse_errors}")
# Builder configuration: cap the scratch workspace at 1 GiB.
config = builder.create_builder_config()
workspace_bytes = 1 << 30
if hasattr(config, "set_memory_pool_limit"):
    # Current API (TensorRT >= 8.4); max_workspace_size no longer exists
    # in TensorRT 10.
    config.set_memory_pool_limit(trt.MemoryPoolType.WORKSPACE, workspace_bytes)
else:
    # Older TensorRT releases only expose the legacy attribute.
    config.max_workspace_size = workspace_bytes
# Build the engine directly in serialized form. build_engine() was removed
# in TensorRT 10, and build_serialized_network() returns None on failure.
serialized_engine = builder.build_serialized_network(network, config)
if serialized_engine is None:
    raise RuntimeError("TensorRT failed to build an engine from model.onnx")
# Save the serialized engine to disk.
with open("model.trt", "wb") as engine_file:
    engine_file.write(serialized_engine)
print("TensorRT 引擎已成功保存到 model.trt")