RoundtTble committed on
Commit
b868983
1 Parent(s): f8a3fd5

Revert "Change model to fp32"

Browse files

This reverts commit f8a3fd514f81ab0f83bfb286620f18a878ec02d0.

Makefile CHANGED
@@ -19,7 +19,8 @@ trt:
19
  "trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
20
  --minShapes=input:1x3x560x560 \
21
  --optShapes=input:2x3x560x560 \
22
- --maxShapes=input:8x3x560x560"
 
23
 
24
 
25
  triton:
@@ -31,5 +32,5 @@ triton:
31
  tritonserver --model-repository=/models
32
 
33
  perf:
34
- docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:6001 --concurrency-range 16:16 --shape input:3,560,560
35
 
 
19
  "trtexec --onnx=onnx/model.onnx --saveEngine=$(MODEL_PATH)/model.plan \
20
  --minShapes=input:1x3x560x560 \
21
  --optShapes=input:2x3x560x560 \
22
+ --maxShapes=input:8x3x560x560 \
23
+ --fp16"
24
 
25
 
26
  triton:
 
32
  tritonserver --model-repository=/models
33
 
34
  perf:
35
+ docker run --gpus all --rm -it --net host nvcr.io/nvidia/tritonserver:23.04-py3-sdk perf_analyzer -m dinov2_vitl14 --percentile=95 -i grpc -u 0.0.0.0:8001 --concurrency-range 16:16 --shape input:3,560,560
36
 
model_repository/dinov2_vitl14/1/model.plan CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:562a3f73d2826bf6cf828e9a83f8775d11981f9fa65c1489311708fae6cfb6a2
3
- size 90532324
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8d32cc4f1324b661d1770102ba25e826e5a40f6bad9692f2e1ca5b00f417693
3
+ size 46068060