# Configure your NGC API key first: when `docker login` prompts for a
# password, enter that NGC key.
# NOTE(review): NGC documentation lists `$oauthtoken` as the username — confirm.
docker login nvcr.io

# Pull the Triton server image that the container below is started from.
docker pull nvcr.io/nvidia/tritonserver:25.02-vllm-python-py3

# Launch an interactive container named "ui-tars" with every GPU exposed,
# sharing the host's network namespace.
docker run \
    --interactive \
    --tty \
    --gpus all \
    --name ui-tars \
    --network host \
    nvcr.io/nvidia/tritonserver:25.02-vllm-python-py3
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python3
# Generation Command: polygraphy run --gen test.py my_define_network.py --trt --fp16 --load-inputs inputs.json --load-outputs layerwise_golden.json --check-error-stat median --atol 0.1 --rtol 0.1
# It will check against outputs stored in layerwise_golden.json
from polygraphy.logger import G_LOGGER | |
from polygraphy import func | |
from polygraphy.backend.trt import NetworkFromOnnxPath | |
import tensorrt as trt | |
from polygraphy import util |