aarondevstack committed on
Commit ·
14ff16b
1
Parent(s): 305b807
feat: initial upload of 512x512 DepthPro CoreML models
Browse files
- DepthPro_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_decoder.mlpackage/Manifest.json +18 -0
- DepthPro_depth.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_depth.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_depth.mlpackage/Manifest.json +18 -0
- DepthPro_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_encoder.mlpackage/Manifest.json +18 -0
- DepthPro_transform.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_transform.mlpackage/Manifest.json +18 -0
- README.md +32 -0
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0777b77bff92bed422a6dcd8636831f17f294252e779d3c42a6a44c6ca5bcd1
|
| 3 |
+
size 44093
|
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06156744bbb4202b57e042a1638aab8addac9a934ceb383d4185a067ab638477
|
| 3 |
+
size 36977600
|
DepthPro_decoder.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"341606E2-CA63-4173-9594-991789F9E809": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"6686BC52-DA2A-42B1-9C1E-C50E57DBB1B0": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "6686BC52-DA2A-42B1-9C1E-C50E57DBB1B0"
|
| 18 |
+
}
|
DepthPro_depth.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a6a0c6dc2b4a9d23799e9867f0e4d6b7f34c010bd2fcd8160c29a5a2d68616b
|
| 3 |
+
size 251713
|
DepthPro_depth.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec705b7425f315869ac3f394f13787f44fb1f191c7f31d911a3f77b3f504c093
|
| 3 |
+
size 609335296
|
DepthPro_depth.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"6B4EEB53-4969-4FEF-A454-71A28AC6ADAB": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"C047E3E0-282A-4EA9-9373-BA698D76FFB9": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "C047E3E0-282A-4EA9-9373-BA698D76FFB9"
|
| 18 |
+
}
|
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44614936d9717f42f27cf5675f11e5b06c9d1f297f7ca1ff599ed631efc65978
|
| 3 |
+
size 558107
|
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d07f012c3a2b60abcf554d2b7eafe0b07bf5e3adbd4e27de4230460eeac38dd4
|
| 3 |
+
size 1255190336
|
DepthPro_encoder.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"522298C7-1BD7-4178-80D6-1320C7FD094E": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"64383B13-BCCE-4BD7-A9C4-A73FC732834E": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "522298C7-1BD7-4178-80D6-1320C7FD094E"
|
| 18 |
+
}
|
DepthPro_transform.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0a33f01ba1aebf2c1c34b2a24775509e98e6edaddc3864f8ecb12c026efaf6a
|
| 3 |
+
size 1446
|
DepthPro_transform.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"0261DB25-260F-4EFD-B40D-75BB2410912F": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"42670EF3-3C7E-434C-B9C4-5DAAD7E897CF": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "42670EF3-3C7E-434C-B9C4-5DAAD7E897CF"
|
| 18 |
+
}
|
README.md
CHANGED
|
@@ -1,3 +1,35 @@
|
|
| 1 |
---
|
| 2 |
license: apple-ascl
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
---
|
| 2 |
license: apple-ascl
|
| 3 |
+
library_name: coreml
|
| 4 |
+
tags:
|
| 5 |
+
- apple
|
| 6 |
+
- amlr
|
| 7 |
+
- computer-vision
|
| 8 |
+
- depth-estimation
|
| 9 |
+
- visionos
|
| 10 |
+
- macos
|
| 11 |
---
|
| 12 |
+
|
| 13 |
+
# DepthPro: High-Resolution Monocular Depth (CoreML)
|
| 14 |
+
|
| 15 |
+
This repository provides CoreML-optimized weights for **DepthPro**, adapted for on-device inference on visionOS and macOS.
|
| 16 |
+
|
| 17 |
+
## Configuration
|
| 18 |
+
- **Resolution**: 512x512 (Optimized for <1s inference)
|
| 19 |
+
- **Precision**: Float16
|
| 20 |
+
- **Architecture**: Multi-scale ViT-Large with Sharp Boundary Refinement
|
| 21 |
+
|
| 22 |
+
## Performance (M2 Apple Vision Pro)
|
| 23 |
+
- **Transform + Encoder**: ~700ms (GPU Fallback)
|
| 24 |
+
- **Decoder + Depth Head**: ~150ms
|
| 25 |
+
- **Total Pipeline**: < 1.0s per frame
|
| 26 |
+
|
| 27 |
+
## Citation
|
| 28 |
+
If you use this model in your research or applications, please cite the original work:
|
| 29 |
+
```bibtex
|
| 30 |
+
@article{Bochkovskii2024:DepthPro,
|
| 31 |
+
title={Depth Pro: Sharp Monocular Metric Depth in Less Than a Second},
|
| 32 |
+
author={Bochkovskii, Aleksei and Delaunoy, Ama{\"e}l and Germain, Hugo and Santos, Marcel and Zhou, Yichao and Richter, Stephan R. and Koltun, Vladlen},
|
| 33 |
+
journal={arXiv preprint arXiv:2410.02073},
|
| 34 |
+
year={2024}
|
| 35 |
+
}
|