Skip to content

Instantly share code, notes, and snippets.

UI-TARS 本地部署

环境

# Set up your NGC key first: at the password prompt of `docker login`, enter your NGC key.
# NOTE(review): NGC docs reportedly expect the literal username `$oauthtoken` — confirm.
docker login nvcr.io
# Pull the tritonserver image (tag 25.02-vllm-python-py3) from nvcr.io.
docker pull nvcr.io/nvidia/tritonserver:25.02-vllm-python-py3
# Start an interactive container named "ui-tars" from that image, with all GPUs
# exposed (--gpus all) and the host's network stack shared (--net host).
docker run -it --gpus all --name "ui-tars" --net host nvcr.io/nvidia/tritonserver:25.02-vllm-python-py3
#!/usr/bin/env python3
# Generation Command: polygraphy run --gen test.py my_define_network.py --trt --fp16 --load-inputs inputs.json --load-outputs layerwise_golden.json --check-error-stat median --atol 0.1 --rtol 0.1
# It will check against outputs stored in layerwise_golden.json
from polygraphy.logger import G_LOGGER
from polygraphy import func
from polygraphy.backend.trt import NetworkFromOnnxPath
import tensorrt as trt
from polygraphy import util