RoundtTble
committed on
Commit
•
f8a3fd5
1
Parent(s):
bdd3916
Change model to fp32
Browse files
- Makefile +2 -3
- model_repository/dinov2_vitl14/1/model.plan +2 -2
Makefile
CHANGED
@@ -19,8 +19,7 @@ trt:
|
|
19 |
"trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
|
20 |
--minShapes=input:1x3x560x560 \
|
21 |
--optShapes=input:2x3x560x560 \
|
22 |
-
--maxShapes=input:8x3x560x560
|
23 |
-
--fp16"
|
24 |
|
25 |
|
26 |
triton:
|
@@ -32,5 +31,5 @@ triton:
|
|
32 |
tritonserver --model-repository=/models
|
33 |
|
34 |
perf:
|
35 |
-
docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:
|
36 |
|
|
|
19 |
"trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
|
20 |
--minShapes=input:1x3x560x560 \
|
21 |
--optShapes=input:2x3x560x560 \
|
22 |
+
--maxShapes=input:8x3x560x560"
|
|
|
23 |
|
24 |
|
25 |
triton:
|
|
|
31 |
tritonserver --model-repository=/models
|
32 |
|
33 |
perf:
|
34 |
+
docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:6001 --concurrency-range 16:16 --shape input:3,560,560
|
35 |
|
model_repository/dinov2_vitl14/1/model.plan
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:562a3f73d2826bf6cf828e9a83f8775d11981f9fa65c1489311708fae6cfb6a2
|
3 |
+
size 90532324
|