add README.md, update model_index.json
Browse files- .gitattributes +1 -0
- README.md +51 -0
- doc/badges/badge-colab.svg +33 -0
- doc/badges/badge-docker.svg +29 -0
- doc/badges/badge-license.svg +27 -0
- doc/badges/badge-pdf.svg +27 -0
- doc/badges/badge-website.svg +129 -0
- doc/teaser_collage_transparant.png +3 -0
- model_index.json +18 -19
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
*.png filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
@@ -1,3 +1,54 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
+
language:
|
4 |
+
- en
|
5 |
+
pipeline_tag: normals-estimation
|
6 |
+
tags:
|
7 |
+
- monocular normals estimation
|
8 |
+
- single image normals estimation
|
9 |
+
- normals
|
10 |
+
- in-the-wild
|
11 |
+
- zero-shot
|
12 |
---
|
13 |
+
# Marigold Normals Model Card
|
14 |
+
|
15 |
+
This model belongs to the family of diffusion-based Marigold models for solving various computer vision tasks.
|
16 |
+
The Marigold Normals model addresses the task of surface normals estimation.
|
17 |
+
It takes an input image and predicts the surface normal at each pixel.
|
18 |
+
The Marigold Normals model is fine-tuned from Stable Diffusion using synthetic data.
|
19 |
+
Thanks to the rich visual knowledge stored in Stable Diffusion, Marigold models possess deep scene understanding and excel at solving computer vision tasks.
|
20 |
+
Read more about Marigold in our paper titled "Repurposing Diffusion-Based Image Generators for Monocular Depth Estimation".
|
21 |
+
|
22 |
+
[![Website](doc/badges/badge-website.svg)](https://marigoldmonodepth.github.io)
|
23 |
+
[![GitHub](https://img.shields.io/github/stars/prs-eth/Marigold?style=default&label=GitHub%20★&logo=github)](https://github.com/prs-eth/Marigold)
|
24 |
+
[![Paper](doc/badges/badge-pdf.svg)](https://arxiv.org/abs/2312.02145)
|
25 |
+
[![Hugging Face Space](https://img.shields.io/badge/🤗%20Hugging%20Face-Space-yellow)](https://huggingface.co/spaces/toshas/marigold)
|
26 |
+
|
27 |
+
Developed by:
|
28 |
+
[Bingxin Ke](http://www.kebingxin.com/),
|
29 |
+
[Anton Obukhov](https://www.obukhov.ai/),
|
30 |
+
[Shengyu Huang](https://shengyuh.github.io/),
|
31 |
+
[Nando Metzger](https://nandometzger.github.io/),
|
32 |
+
[Rodrigo Caye Daudt](https://rcdaudt.github.io/),
|
33 |
+
[Konrad Schindler](https://scholar.google.com/citations?user=FZuNgqIAAAAJ&hl=en)
|
34 |
+
|
35 |
+
![teaser](doc/teaser_collage_transparant.png)
|
36 |
+
|
37 |
+
## 🎓 Citation
|
38 |
+
|
39 |
+
```bibtex
|
40 |
+
@InProceedings{ke2023repurposing,
|
41 |
+
title={Repurposing Diffusion-Based Image Generators for Monocular Depth Estimation},
|
42 |
+
author={Bingxin Ke and Anton Obukhov and Shengyu Huang and Nando Metzger and Rodrigo Caye Daudt and Konrad Schindler},
|
43 |
+
booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
|
44 |
+
year={2024}
|
45 |
+
}
|
46 |
+
```
|
47 |
+
|
48 |
+
## 🎫 License
|
49 |
+
|
50 |
+
This work is licensed under the Apache License, Version 2.0 (as defined in the [LICENSE](LICENSE.txt)).
|
51 |
+
|
52 |
+
By downloading and using the code and model, you agree to the terms in the [LICENSE](LICENSE.txt).
|
53 |
+
|
54 |
+
[![License](https://img.shields.io/badge/License-Apache--2.0-929292)](https://www.apache.org/licenses/LICENSE-2.0)
|
doc/badges/badge-colab.svg
ADDED
doc/badges/badge-docker.svg
ADDED
doc/badges/badge-license.svg
ADDED
doc/badges/badge-pdf.svg
ADDED
doc/badges/badge-website.svg
ADDED
doc/teaser_collage_transparant.png
ADDED
Git LFS Details
|
model_index.json
CHANGED
@@ -1,25 +1,24 @@
|
|
1 |
{
|
2 |
-
"_class_name":
|
3 |
-
"_diffusers_version":
|
4 |
-
"
|
5 |
-
|
6 |
-
|
7 |
-
"DDIMScheduler"
|
8 |
],
|
9 |
-
"
|
10 |
-
|
11 |
-
|
12 |
],
|
13 |
-
"
|
14 |
-
|
15 |
-
|
16 |
],
|
17 |
-
"
|
18 |
-
|
19 |
-
|
20 |
],
|
21 |
-
"
|
22 |
-
|
23 |
-
|
24 |
]
|
25 |
-
}
|
|
|
1 |
{
|
2 |
+
"_class_name":"MarigoldPipeline",
|
3 |
+
"_diffusers_version":"0.24.0",
|
4 |
+
"unet":[
|
5 |
+
"diffusers",
|
6 |
+
"UNet2DConditionModel"
|
|
|
7 |
],
|
8 |
+
"vae":[
|
9 |
+
"diffusers",
|
10 |
+
"AutoencoderKL"
|
11 |
],
|
12 |
+
"scheduler":[
|
13 |
+
"diffusers",
|
14 |
+
"DDIMScheduler"
|
15 |
],
|
16 |
+
"text_encoder":[
|
17 |
+
"transformers",
|
18 |
+
"CLIPTextModel"
|
19 |
],
|
20 |
+
"tokenizer":[
|
21 |
+
"transformers",
|
22 |
+
"CLIPTokenizer"
|
23 |
]
|
24 |
+
}
|