Commit
•
b868983
1
Parent(s):
f8a3fd5
Revert "Change model to fp32"
Browse files
This reverts commit f8a3fd514f81ab0f83bfb286620f18a878ec02d0.
- Makefile +3 -2
- model_repository/dinov2_vitl14/1/model.plan +2 -2
Makefile
CHANGED
@@ -19,7 +19,8 @@ trt:
|
|
19 |
"trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
|
20 |
--minShapes=input:1x3x560x560 \
|
21 |
--optShapes=input:2x3x560x560 \
|
22 |
-
--maxShapes=input:8x3x560x560
|
|
|
23 |
|
24 |
|
25 |
triton:
|
@@ -31,5 +32,5 @@ triton:
|
|
31 |
tritonserver --model-repository=/models
|
32 |
|
33 |
perf:
|
34 |
-
docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:
|
35 |
|
|
|
19 |
"trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
|
20 |
--minShapes=input:1x3x560x560 \
|
21 |
--optShapes=input:2x3x560x560 \
|
22 |
+
--maxShapes=input:8x3x560x560 \
|
23 |
+
--fp16"
|
24 |
|
25 |
|
26 |
triton:
|
|
|
32 |
tritonserver --model-repository=/models
|
33 |
|
34 |
perf:
|
35 |
+
docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:8001 --concurrency-range 16:16 --shape input:3,560,560
|
36 |
|
model_repository/dinov2_vitl14/1/model.plan
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8d32cc4f1324b661d1770102ba25e826e5a40f6bad9692f2e1ca5b00f417693
|
3 |
+
size 46068060
|