Spaces:

leditsplusplus
/

project

Running

project / index.html

Linoy Tsaban

Update index.html

3eb9a39 over 1 year ago

14 kB

	<!DOCTYPE html>
	<html>
	<head>
	<meta charset="utf-8">
	<meta name="description"
	content="LEdits++ Limitless Image Editing using Text-to-Image Models">
	<meta name="keywords"
	content="LEDITS++, DPM solver++ inversion, LEDITS, semantic guidance, SEGA, real image editing">
	<meta name="viewport" content="width=device-width, initial-scale=1">
	<title> LEDITS++: Limitless Image Editing using Text-to-Image Models </title>

	<link href="https://fonts.googleapis.com/css?family=Google+Sans\|Noto+Sans\|Castoro"
	rel="stylesheet">

	<link rel="stylesheet" href="./static/css/bulma.min.css">
	<link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
	<link rel="stylesheet" href="./static/css/bulma-slider.min.css">
	<link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
	<link rel="stylesheet"
	href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
	<link rel="stylesheet" href="./static/css/index.css">
	<link rel="icon" href="./static/images/painting-mascot.svg">

	<script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
	<script defer src="./static/js/fontawesome.all.min.js"></script>
	<script src="./static/js/bulma-carousel.min.js"></script>
	<script src="./static/js/bulma-slider.min.js"></script>
	<script src="./static/js/index.js"></script>
	</head>
	<body>

	<nav class="navbar" role="navigation" aria-label="main navigation">
	<div class="navbar-brand">
	<a role="button" class="navbar-burger" aria-label="menu" aria-expanded="false">
	<span aria-hidden="true"></span>
	<span aria-hidden="true"></span>
	<span aria-hidden="true"></span>
	</a>
	</div>
	</nav>


	<section class="hero">
	<div class="hero-body">
	<div class="container is-max-desktop">
	<div class="columns is-centered">
	<div class="column has-text-centered">
	<h1 class="title is-1 publication-title">LEDITS++: Limitless Image Editing using Text-to-Image Models</h1>
	<div class="is-size-5 publication-authors">
	<span class="author-block">
	<a>Manuel Brack</a>,</span>
	<span class="author-block">
	<a>Linoy Tsaban</a>,</span>
	<span class="author-block">
	<a>Katharina Kornmeier</a>,</span>
	<span class="author-block">
	<a>Apolinário Passos</a>,</span>
	<p></p>
	<span class="author-block">
	<a>Felix Friedrich</a>,</span>
	<span class="author-block">
	<a>Patrick Schramowski</a>,</span>
	<span class="author-block">
	<a>Kristian Kersting</a></span>



	<div class="is-size-5 publication-authors">
	<span class="author-block">German Research Center for Artificial Intelligence (DFKI),</span>
	</div>
	<div class="is-size-5 publication-authors">
	<span class="author-block">Computer Science Department, TU Darmstadt,</span>
	</div>
	<div class="is-size-5 publication-authors">
	<span class="author-block">HuggingFace🤗,</span>
	</div>
	<div class="is-size-5 publication-authors">
	<span class="author-block">Hessian.AI,</span>
	</div>
	<div class="is-size-5 publication-authors">
	<span class="author-block">LAION,</span>
	</div>
	<div class="is-size-5 publication-authors">
	<span class="author-block">Centre for Cognitive Science, TU Darmstadt</span>
	</div>

	<div class="column has-text-centered">
	<div class="publication-links">
	<!-- arxiv Link. -->
	<!-- <span class="link-block">-->
	<!-- <a href=""-->
	<!-- class="external-link button is-normal is-rounded is-dark">-->
	<!-- <span class="icon">-->
	<!-- <i class="ai ai-arxiv"></i>-->
	<!-- </span>-->
	<!-- <span>arXiv</span>-->
	<!-- </a>-->
	<!-- </span>-->

	<!-- Demo Link. -->
	<span class="link-block">
	<a href="https://huggingface.co/spaces/editing-images/ledtisplusplus"
	class="external-link button is-normal is-rounded is-dark">

	<span>🤗 Demo</span>
	</a>
	</span>
	<!-- <!– Code Link. –>-->
	<!-- <span class="link-block">-->
	<!-- <a href=""-->
	<!-- class="external-link button is-normal is-rounded is-dark">-->
	<!-- <span class="icon">-->
	<!-- <i class="fa-github"></i>-->
	<!-- </span>-->
	<!-- <span>Code</span>-->
	<!-- </a>-->
	<!-- </span>-->

	</div>

	</div>
	</div>
	</div>
	</div>
	</div>
	</section>

	<section class="hero teaser">
	<div class="container is-max-desktop">
	<div class="hero-body">

	<video autoplay muted loop playsinline height="100%">
	<source src="static/videos/teaser_gif.mp4"
	type="video/mp4">
	</video>

	<h2 class="subtitle has-text-centered">
	Teaser GIF/image description
	</h2>

	</div>
	</div>
	</section>


	<section class="section">
	<div class="container is-max-desktop">
	<!-- Abstract. -->
	<div class="columns is-centered has-text-centered">
	<div class="column is-four-fifths">
	<h2 class="title is-3">Abstract</h2>
	<div class="content has-text-justified">
	<p>
	Text-to-image diffusion models have recently received a lot of interest for their
	astonishing ability to produce high-fidelity images from text only. Subsequent
	research efforts are aiming to exploit the capabilities of these models and leverage
	them for intuitive, textual image editing. However, existing methods often require
	time-consuming fine-tuning and lack native support for performing multiple edits
	simultaneously. To address these issues, we introduce LEDITS++ , an efficient yet
	versatile technique for image editing using text-to-image models. LEDITS++ re-
	quires no tuning nor optimization, runs in a few diffusion steps, natively supports
	multiple simultaneous edits, inherently limits changes to relevant image regions,
	and is architecture agnostic.
	</p>

	</div>
	</div>
	</div>

	</div>
	</section>

	<section class="section">
	<div class="container is-max-desktop">
	<div class="columns is-centered has-text-centered">
	<img src="static/images/teaser.png"
	class="interpolation-image"
	style="max-height:700px; max-width:1000px"
	alt="ledits++ teaser"/>
	</div>
	</div>
	</section>



	<section class="section">
	<div class="container is-max-desktop">
	<!-- Introduction -->
	<div class="columns is-centered has-text-centered">
	<h2 class="title is-3">LEDITS++: Efficient and Versatile Textual Image Editing</h2>
	</div>
	<div class="content has-text-justified">
	<p>
	To ease textual image editing, we present LEDITS++, a novel method for efficient and versatile image
	editing using text-to-image diffusion models. Firstly, LEDITS++ sets itself apart as a parameter-free
	solution requiring no fine-tuning nor any optimization. We derive characteristics of an edit-friendly
	noise space with a perfect input reconstruction, which were previously proposed for the DDPM
	sampling scheme, for a significantly faster multistep stochastic differential-equation (SDE)
	solver. This novel invertibility of the DPM-solver++ facilitates editing with LEDITS++ in as
	little as 20 total diffusion steps for inversion and inference combined.
	Moreover, LEDITS++ places a strong emphasis on semantic grounding to enhance the visual and
	contextual coherence of the edits. This ensures that changes are limited to the relevant regions in the
	image, preserving the original image’s fidelity as much as possible. LEDITS++ also provides users
	with the flexibility to combine multiple edits seamlessly, opening up new creative possibilities for
	intricate image manipulations. Finally, the approach is architecture-agnostic and compatible with any
	diffusion model, whether latent or pixel-based.
	</p>
	<section class="section">
	<div class="container is-max-desktop">
	<div class="columns is-centered has-text-centered">
	<img src="static/images/ledits_teaser.jpg"
	class="interpolation-image"
	style="max-height:800px; max-width:1200px"
	alt="examples"/>
	</div>
	</div>
	</section>
	<div class="columns is-centered has-text-centered">
	<h2 class="title is-3">Methodology
	</h2>
	</div>
	<p>
	The methodology of LEDITS++ can be broken down into three components: (1) efficient image
	inversion, (2) versatile textual editing, and (3) semantic grounding of image changes. More in-depth
	details and mathematical derivations of each component can be found in App
	</p>

	<div class="columns is-centered has-text-centered">
	<img src="static/images/diagram.jpg"
	style="max-height:620px; max-width:700px"
	alt="diagram"/>
	</div>

	</div>


	</div>
	</section>


	<section class="section">
	<div class="container is-max-desktop">
	<div class="column">


	<div class="columns is-centered">

	<!-- Editing workflows -->
	<div class="column">
	<div class="content">
	<h2 class="title is-4">Component 1: Image Inversion</h2>
	<p>

	</p>

	</div>
	</div>


	<div class="column">
	<h2 class="title is-4">Component 2: Textual Editing</h2>
	<div class="columns is-centered">
	<div class="column content">
	<p>

	</p>

	</div>

	</div>
	</div>

	<div class="column">
	<h2 class="title is-4">Component 3: Semantic Grounding</h2>
	<div class="columns is-centered">
	<div class="column content">
	<p>

	</p>

	</div>

	</div>
	</div>

	</div>
	</div>
	</div>

	</section>

	<!-- portraits video -->
	<!--<section class="hero teaser">-->
	<!-- <div class="container is-max-desktop">-->
	<!-- <div class="hero-body">-->
	<!-- <video id="portraits" autoplay muted loop playsinline height="100%">-->
	<!-- <source src="./static/videos/portraits.mp4"-->
	<!-- type="video/mp4">-->
	<!-- </video>-->
	<!-- <h2 class="subtitle has-text-centered">-->
	<!-- Gif/image description-->
	<!-- </h2>-->

	<!-- </div>-->
	<!-- </div>-->
	<!--</section>-->

	<!-- 3 key observations -->


	<section class="section" id="BibTeX">
	<div class="container is-max-desktop content">
	<h2 class="title">BibTeX</h2>
	<pre><code>@article{
	}</code></pre>
	</div>
	</section>


	<footer class="footer">
	<div class="container">
	<div class="columns is-centered">
	<div class="column is-8">
	<div class="content">
	<p>
	This website is licensed under a <a rel="license"
	href="http://creativecommons.org/licenses/by-sa/4.0/">Creative
	Commons Attribution-ShareAlike 4.0 International License</a>.
	</p>
	<p>
	This page was built using the source code of:
	<a rel="nerfies.github.io"
	href="https://github.com/nerfies/nerfies.github.io">nerfies.github.io</a>
	</p>
	</div>
	</div>
	</div>
	</div>
	</footer>

	</body>
	</html>