aarondevstack committed on
Commit
738a247
·
1 Parent(s): 71465c3

feat: initial upload of 1024x1024 DepthPro CoreML models

Browse files
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956d38a0917e09b44a3b4021c6d78537a8f94a6786537434ea156419aa3f6203
3
+ size 43505
DepthPro_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:835e2e1b5669a0829e10f05ea488398a2c2700c5bd6ac2923d313d71f8938523
3
+ size 36977600
DepthPro_decoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "1E21BD8D-AA95-4FDB-BC46-63DA38064C53": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "583B1644-7ECF-415C-AB5D-9856FC45FC2A": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "1E21BD8D-AA95-4FDB-BC46-63DA38064C53"
18
+ }
DepthPro_depth.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea9b97a3ba6eace7c0db6d3ec70803ec4421a068abde2669c81da7ab60e16b40
3
+ size 251713
DepthPro_depth.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1bfe93ab1fe0b313838c697e013b6cd90fd0a42657407d4da9e0d359dc1cbad
3
+ size 609335296
DepthPro_depth.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "9CED9AF1-2245-4AF9-B316-5B462C7DE2C4": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "CB5CA919-9A1F-4FB2-87E7-D8D7EA19B653": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "9CED9AF1-2245-4AF9-B316-5B462C7DE2C4"
18
+ }
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa60d4e13dee22215616497ab586e0861a9f86c73030302460e31f10c83f329
3
+ size 954323
DepthPro_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e582e80dfe67489c4afd6f4e551c7669ae84da80728451d737790b4f5438285
3
+ size 1255288640
DepthPro_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "6DED6546-056A-43C5-A77B-9E59676594F4": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "9CFDD29B-5A8F-449C-958B-C05ED5D7AB25": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "6DED6546-056A-43C5-A77B-9E59676594F4"
18
+ }
DepthPro_transform.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04bb60c3adddd9d378bfd18987e5b7b96930c9fe24b23acb24079b7076dc500b
3
+ size 1446
DepthPro_transform.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "5D664207-AC2D-411E-A29D-17DBE2A243A1": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Weights",
7
+ "name": "weights",
8
+ "path": "com.apple.CoreML/weights"
9
+ },
10
+ "CDDE2568-8A25-44D7-AF87-24C0C45E49B8": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "CDDE2568-8A25-44D7-AF87-24C0C45E49B8"
18
+ }
README.md CHANGED
@@ -1,3 +1,51 @@
1
  ---
2
  license: apple-ascl
 
 
 
 
 
 
 
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: apple-ascl
3
+ library_name: coreml
4
+ tags:
5
+ - depth-estimation
6
+ - visionos
7
+ - apple-silicon
8
+ - amlr
9
+ - computer-vision
10
+ - depth-pro
11
+ - 1024x1024
12
+ extra_gated_heading: DepthPro CoreML (High-Resolution 1024px)
13
+ extra_gated_button_content: Access Model
14
  ---
15
+
16
+ # DepthPro CoreML (1024x1024 High-Resolution)
17
+
18
+ This repository contains the **High-Resolution (1024x1024)** version of the DepthPro model, optimized for CoreML.
19
+
20
+ DepthPro is a state-of-the-art monocular depth estimation model that provides sharp, metric-scale depth maps. This 1024px version is specifically designed for **High-Quality 3D Exports** where edge precision and fine detail preservation are critical.
21
+
22
+ ## 🚀 Key Features
23
+ - **High Fidelity**: Captures thin structures (threads, instruments, hair) with superior accuracy compared to the 512px version.
24
+ - **Optimized for Symmetric 3D Rendering**: Well suited to symmetric shifting in VR/AR, helping to minimize visual discomfort.
25
+ - **visionOS Ready**: Fully compatible with Apple Vision Pro (optimized for GPU/CPU).
26
+
27
+ ## 📊 Performance & Requirements
28
+ | Metric | Specification |
29
+ | :--- | :--- |
30
+ | **Input Resolution** | 1024 x 1024 pixels |
31
+ | **Compute Units** | GPU + CPU (Recommended for stability) |
32
+ | **Average Latency** | ~7.5s per frame (on M2 Ultra/M3 Max) |
33
+ | **Target Use Case** | Offline Video Conversion / High-Quality Spatial Video Export |
34
+
35
+ > [!IMPORTANT]
36
+ > To ensure inference stability at this resolution, this model is configured to use the **GPU/CPU path** rather than ANE to avoid memory limits.
37
+
38
+ ## 📦 Repository Contents
39
+ The repository contains the following core components:
40
+ 1. `DepthPro_transform.mlpackage`: Image preprocessing.
41
+ 2. `DepthPro_encoder.mlpackage`: Feature extraction (ViT-Large).
42
+ 3. `DepthPro_decoder.mlpackage`: Multiresolution fusion.
43
+ 4. `DepthPro_depth.mlpackage`: Final depth output and high-res feature generation.
44
+
45
+ ## 🛠 Usage with Swift Transformers
46
+ You can download and cache this model dynamically using `swift-transformers`:
47
+
48
+ ```swift
49
+ let hub = HubApi()
50
+ let modelDir = try await hub.snapshot(from: "aarondevstack/DepthPro-1024x1024-coreml")
51
+ // Load models from the downloaded directory