Depth-Anything

Sleeping

LiheYoung committed on Jan 23

Commit

116da01

•

1 Parent(s): 2493a1e

Load from Hugging Face

Files changed (2) hide show

depth_anything/dpt.py CHANGED Viewed

@@ -1,8 +1,10 @@
 import torch
 import torch.nn as nn
-from .blocks import FeatureFusionBlock, _make_scratch
 import torch.nn.functional as F
 def _make_fusion_block(features, use_bn, size = None):
@@ -143,7 +145,6 @@ class DPT_DINOv2(nn.Module):
         # in case the Internet connection is not stable, please load the DINOv2 locally
         if localhub:
             self.pretrained = torch.hub.load('torchhub/facebookresearch_dinov2_main', 'dinov2_{:}14'.format(encoder), source='local', pretrained=False)
-            # self.pretrained.load_state_dict(torch.load('checkpoints/dinov2_{:}14_pretrain.pth'.format(encoder)))
         else:
             self.pretrained = torch.hub.load('facebookresearch/dinov2', 'dinov2_{:}14'.format(encoder))
@@ -165,7 +166,22 @@ class DPT_DINOv2(nn.Module):
         return depth.squeeze(1)
 if __name__ == '__main__':
-    depth_anything = DPT_DINOv2()
-    depth_anything.load_state_dict(torch.load('checkpoints/depth_anything_dinov2_vitl14.pth'))

+import argparse
 import torch
 import torch.nn as nn
 import torch.nn.functional as F
+from huggingface_hub import PyTorchModelHubMixin, hf_hub_download
+from depth_anything.blocks import FeatureFusionBlock, _make_scratch
 def _make_fusion_block(features, use_bn, size = None):
         # in case the Internet connection is not stable, please load the DINOv2 locally
         if localhub:
             self.pretrained = torch.hub.load('torchhub/facebookresearch_dinov2_main', 'dinov2_{:}14'.format(encoder), source='local', pretrained=False)
         else:
             self.pretrained = torch.hub.load('facebookresearch/dinov2', 'dinov2_{:}14'.format(encoder))
         return depth.squeeze(1)
+class DepthAnything(DPT_DINOv2, PyTorchModelHubMixin):
+    def __init__(self, config):
+        super().__init__(**config)
 if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument(
+        "--encoder",
+        default="vits",
+        type=str,
+        choices=["vits", "vitb", "vitl"],
+    )
+    args = parser.parse_args()
+    model = DepthAnything.from_pretrained("LiheYoung/depth_anything_{:}14".format(args.encoder))
+    print(model)

requirements.txt CHANGED Viewed

@@ -1,4 +1,6 @@
 gradio_imageslider
 torch
 torchvision
 opencv-python

 gradio_imageslider
+gradio==4.14.0
 torch
 torchvision
 opencv-python
+huggingface_hub