toshas committed on
Commit
a880811
•
1 Parent(s): 764f76f

add README.md, update model_index.json

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.png filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,3 +1,54 @@
1
  ---
2
  license: apache-2.0
 
 
 
 
 
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: apache-2.0
3
+ language:
4
+ - en
5
+ pipeline_tag: normals-estimation
6
+ tags:
7
+ - monocular normals estimation
8
+ - single image normals estimation
9
+ - normals
10
+ - in-the-wild
11
+ - zero-shot
12
  ---
13
+ # Marigold Normals Model Card
14
+
15
+ This model belongs to the family of diffusion-based Marigold models for solving various computer vision tasks.
16
+ The Marigold Normals model focuses on the surface normals task.
17
+ It takes an input image and computes surface normals at each pixel.
18
+ The Marigold Normals model is fine-tuned from Stable Diffusion on synthetic data.
19
+ Thanks to the rich visual knowledge stored in Stable Diffusion, Marigold models possess deep scene understanding and excel at solving computer vision tasks.
20
+ Read more about Marigold in our paper titled "Repurposing Diffusion-Based Image Generators for Monocular Depth Estimation".
21
+
22
+ [![Website](doc/badges/badge-website.svg)](https://marigoldmonodepth.github.io)
23
+ [![GitHub](https://img.shields.io/github/stars/prs-eth/Marigold?style=default&label=GitHub%20★&logo=github)](https://github.com/prs-eth/Marigold)
24
+ [![Paper](doc/badges/badge-pdf.svg)](https://arxiv.org/abs/2312.02145)
25
+ [![Hugging Face Space](https://img.shields.io/badge/🤗%20Hugging%20Face-Space-yellow)](https://huggingface.co/spaces/toshas/marigold)
26
+
27
+ Developed by:
28
+ [Bingxin Ke](http://www.kebingxin.com/),
29
+ [Anton Obukhov](https://www.obukhov.ai/),
30
+ [Shengyu Huang](https://shengyuh.github.io/),
31
+ [Nando Metzger](https://nandometzger.github.io/),
32
+ [Rodrigo Caye Daudt](https://rcdaudt.github.io/),
33
+ [Konrad Schindler](https://scholar.google.com/citations?user=FZuNgqIAAAAJ&hl=en)
34
+
35
+ ![teaser](doc/teaser_collage_transparant.png)
36
+
37
+ ## 🎓 Citation
38
+
39
+ ```bibtex
40
+ @InProceedings{ke2023repurposing,
41
+ title={Repurposing Diffusion-Based Image Generators for Monocular Depth Estimation},
42
+ author={Bingxin Ke and Anton Obukhov and Shengyu Huang and Nando Metzger and Rodrigo Caye Daudt and Konrad Schindler},
43
+ booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
44
+ year={2024}
45
+ }
46
+ ```
47
+
48
+ ## 🎫 License
49
+
50
+ This work is licensed under the Apache License, Version 2.0 (as defined in the [LICENSE](LICENSE.txt)).
51
+
52
+ By downloading and using the code and model, you agree to the terms in the [LICENSE](LICENSE.txt).
53
+
54
+ [![License](https://img.shields.io/badge/License-Apache--2.0-929292)](https://www.apache.org/licenses/LICENSE-2.0)
doc/badges/badge-colab.svg ADDED
doc/badges/badge-docker.svg ADDED
doc/badges/badge-license.svg ADDED
doc/badges/badge-pdf.svg ADDED
doc/badges/badge-website.svg ADDED
doc/teaser_collage_transparant.png ADDED

Git LFS Details

  • SHA256: 9ac22708df13690f231aae38a833a49efb38ce0479e3aa14213034fda7aac970
  • Pointer size: 132 Bytes
  • Size of remote file: 5.14 MB
model_index.json CHANGED
@@ -1,25 +1,24 @@
1
  {
2
- "_class_name": "MarigoldNormalsEstimationPipeline",
3
- "_diffusers_version": "0.27.2",
4
- "_name_or_path": "prs-eth/marigold-v1-0",
5
- "scheduler": [
6
- "diffusers",
7
- "DDIMScheduler"
8
  ],
9
- "text_encoder": [
10
- "transformers",
11
- "CLIPTextModel"
12
  ],
13
- "tokenizer": [
14
- "transformers",
15
- "CLIPTokenizer"
16
  ],
17
- "unet": [
18
- "diffusers",
19
- "UNet2DConditionModel"
20
  ],
21
- "vae": [
22
- "diffusers",
23
- "AutoencoderKL"
24
  ]
25
- }
 
1
  {
2
+ "_class_name":"MarigoldPipeline",
3
+ "_diffusers_version":"0.24.0",
4
+ "unet":[
5
+ "diffusers",
6
+ "UNet2DConditionModel"
 
7
  ],
8
+ "vae":[
9
+ "diffusers",
10
+ "AutoencoderKL"
11
  ],
12
+ "scheduler":[
13
+ "diffusers",
14
+ "DDIMScheduler"
15
  ],
16
+ "text_encoder":[
17
+ "transformers",
18
+ "CLIPTextModel"
19
  ],
20
+ "tokenizer":[
21
+ "transformers",
22
+ "CLIPTokenizer"
23
  ]
24
+ }