aarondevstack committed on
Commit ·
738a247
1
Parent(s): 71465c3
feat: initial upload of 1024x1024 DepthPro CoreML models
Browse files- DepthPro_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_decoder.mlpackage/Manifest.json +18 -0
- DepthPro_depth.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_depth.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_depth.mlpackage/Manifest.json +18 -0
- DepthPro_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- DepthPro_encoder.mlpackage/Manifest.json +18 -0
- DepthPro_transform.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- DepthPro_transform.mlpackage/Manifest.json +18 -0
- README.md +48 -0
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:956d38a0917e09b44a3b4021c6d78537a8f94a6786537434ea156419aa3f6203
|
| 3 |
+
size 43505
|
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:835e2e1b5669a0829e10f05ea488398a2c2700c5bd6ac2923d313d71f8938523
|
| 3 |
+
size 36977600
|
DepthPro_decoder.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"1E21BD8D-AA95-4FDB-BC46-63DA38064C53": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"583B1644-7ECF-415C-AB5D-9856FC45FC2A": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "1E21BD8D-AA95-4FDB-BC46-63DA38064C53"
|
| 18 |
+
}
|
DepthPro_depth.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea9b97a3ba6eace7c0db6d3ec70803ec4421a068abde2669c81da7ab60e16b40
|
| 3 |
+
size 251713
|
DepthPro_depth.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1bfe93ab1fe0b313838c697e013b6cd90fd0a42657407d4da9e0d359dc1cbad
|
| 3 |
+
size 609335296
|
DepthPro_depth.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"9CED9AF1-2245-4AF9-B316-5B462C7DE2C4": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"CB5CA919-9A1F-4FB2-87E7-D8D7EA19B653": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "9CED9AF1-2245-4AF9-B316-5B462C7DE2C4"
|
| 18 |
+
}
|
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fa60d4e13dee22215616497ab586e0861a9f86c73030302460e31f10c83f329
|
| 3 |
+
size 954323
|
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e582e80dfe67489c4afd6f4e551c7669ae84da80728451d737790b4f5438285
|
| 3 |
+
size 1255288640
|
DepthPro_encoder.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"6DED6546-056A-43C5-A77B-9E59676594F4": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"9CFDD29B-5A8F-449C-958B-C05ED5D7AB25": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "6DED6546-056A-43C5-A77B-9E59676594F4"
|
| 18 |
+
}
|
DepthPro_transform.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04bb60c3adddd9d378bfd18987e5b7b96930c9fe24b23acb24079b7076dc500b
|
| 3 |
+
size 1446
|
DepthPro_transform.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"5D664207-AC2D-411E-A29D-17DBE2A243A1": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"CDDE2568-8A25-44D7-AF87-24C0C45E49B8": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "CDDE2568-8A25-44D7-AF87-24C0C45E49B8"
|
| 18 |
+
}
|
README.md
CHANGED
|
@@ -1,3 +1,51 @@
|
|
| 1 |
---
|
| 2 |
license: apple-ascl
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
---
|
| 2 |
license: apple-ascl
|
| 3 |
+
library_name: coreml
|
| 4 |
+
tags:
|
| 5 |
+
- depth-estimation
|
| 6 |
+
- visionos
|
| 7 |
+
- apple-silicon
|
| 8 |
+
- amlr
|
| 9 |
+
- computer-vision
|
| 10 |
+
- depth-pro
|
| 11 |
+
- 1024x1024
|
| 12 |
+
extra_gated_heading: DepthPro CoreML (High-Resolution 1024px)
|
| 13 |
+
extra_gated_button_content: Access Model
|
| 14 |
---
|
| 15 |
+
|
| 16 |
+
# DepthPro CoreML (1024x1024 High-Resolution)
|
| 17 |
+
|
| 18 |
+
This repository contains the **High-Resolution (1024x1024)** version of the DepthPro model, optimized for CoreML.
|
| 19 |
+
|
| 20 |
+
DepthPro is a state-of-the-art monocular depth estimation model that provides sharp, metric-scale depth maps. This 1024px version is specifically designed for **High-Quality 3D Exports** where edge precision and fine detail preservation are critical.
|
| 21 |
+
|
| 22 |
+
## 🚀 Key Features
|
| 23 |
+
- **High Fidelity**: Captures thin structures (threads, instruments, hair) with superior accuracy compared to the 512px version.
|
| 24 |
+
- **Optimized for Symmetric 3D Rendering**: Well suited to symmetric shifting in VR/AR, which helps minimize visual discomfort.
|
| 25 |
+
- **visionOS Ready**: Fully compatible with Apple Vision Pro (optimized for GPU/CPU).
|
| 26 |
+
|
| 27 |
+
## 📊 Performance & Requirements
|
| 28 |
+
| Metric | Specification |
|
| 29 |
+
| :--- | :--- |
|
| 30 |
+
| **Input Resolution** | 1024 x 1024 pixels |
|
| 31 |
+
| **Compute Units** | GPU + CPU (Recommended for stability) |
|
| 32 |
+
| **Average Latency** | ~7.5s per frame (on M2 Ultra/M3 Max) |
|
| 33 |
+
| **Target Use Case** | Offline Video Conversion / High-Quality Spatial Video Export |
|
| 34 |
+
|
| 35 |
+
> [!IMPORTANT]
|
| 36 |
+
> To ensure inference stability at this resolution, this model is configured to use the **GPU/CPU path** rather than the Apple Neural Engine (ANE), which avoids the ANE's memory limits.
|
| 37 |
+
|
| 38 |
+
## 📦 Repository Contents
|
| 39 |
+
The repository contains the following core components:
|
| 40 |
+
1. `DepthPro_transform.mlpackage`: Image preprocessing.
|
| 41 |
+
2. `DepthPro_encoder.mlpackage`: Feature extraction (ViT-Large).
|
| 42 |
+
3. `DepthPro_decoder.mlpackage`: Multiresolution fusion.
|
| 43 |
+
4. `DepthPro_depth.mlpackage`: Final depth output and high-res feature generation.
|
| 44 |
+
|
| 45 |
+
## 🛠 Usage with Swift Transformers
|
| 46 |
+
You can download and cache this model dynamically using `swift-transformers`:
|
| 47 |
+
|
| 48 |
+
```swift
|
| 49 |
+
let hub = Hub()
|
| 50 |
+
let modelDir = try await hub.snapshot(repoId: "aarondevstack/DepthPro-1024x1024-coreml")
|
| 51 |
+
// Load models from the downloaded directory
|