| { | |
| "model_id": "Alpha-VLLM/Lumina-Image-2.0", | |
| "downloads": 10219, | |
| "tags": [ | |
| "diffusers", | |
| "safetensors", | |
| "text-to-image", | |
| "arxiv:2503.21758", | |
| "license:apache-2.0", | |
| "diffusers:Lumina2Pipeline", | |
| "region:us" | |
| ], | |
| "description": "--- pipeline_tag: text-to-image library_name: diffusers license: apache-2.0 --- [Image: Lumina-Image 2.0] Lumina-Image-2.0 is a 2 billion parameter flow-based diffusion transformer capable of generating images from text descriptions. For more information, visit our GitHub. ## Gradio Demo We provide an official Gradio demo. You can use the link we provided to try it out. ## Usage This is a Hugging Face Diffusers implementation of the paper Lumina-Image 2.0: A Unified and Efficient Image Generative Framework. ## Citation If you find the provided code or models useful for your research, consider citing the paper (arXiv:2503.21758).", | |
| "model_explanation_gemini": "Generates images from text descriptions using a 2B parameter flow-based diffusion transformer. \n\nFeatures: \n- Text-to-image generation \n- 2 billion parameter architecture \n- Flow-based diffusion transformer \n- Hugging Face Diffusers implementation \n\nComparison: Not explicitly compared to other models in the description.", | |
| "release_year": "2025", | |
| "parameter_count": null, | |
| "is_fine_tuned": false, | |
| "category": "Diffusion", | |
| "api_enhanced": true | |
| } |