Spaces:
Running
Running
Linoy Tsaban
committed on
Commit
·
f06d376
1
Parent(s):
0ba4738
Update index.html
Browse files- index.html +120 -92
index.html
CHANGED
|
@@ -27,19 +27,21 @@
|
|
| 27 |
<script src="./static/js/bulma-slider.min.js"></script>
|
| 28 |
<script src="./static/js/index.js"></script>
|
| 29 |
<style>
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
|
|
|
|
|
|
| 43 |
</style>
|
| 44 |
</head>
|
| 45 |
<body>
|
|
@@ -56,12 +58,13 @@
|
|
| 56 |
|
| 57 |
|
| 58 |
<section class="hero">
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
|
|
|
| 65 |
<span class="author-block">
|
| 66 |
<a href="https://scholar.google.com/citations?user=kJ9Abf8AAAAJ&hl=en">Manuel Brack</a>¹²,
|
| 67 |
</span>
|
|
@@ -84,7 +87,7 @@
|
|
| 84 |
<a href="https://twitter.com/multimodalart">Apolinário Passos</a>⁴
|
| 85 |
</span>
|
| 86 |
<p></p>
|
| 87 |
-
|
| 88 |
<div class="is-size-5 publication-authors">
|
| 89 |
<span class="author-block">¹ German Research Center for Artificial Intelligence (DFKI),</span>
|
| 90 |
<span class="author-block">² Computer Science Department, TU Darmstadt,</span>
|
|
@@ -93,10 +96,10 @@
|
|
| 93 |
<span class="author-block">⁵ Centre for Cognitive Science, TU Darmstadt,</span>
|
| 94 |
<span class="author-block">⁶ LAION</span>
|
| 95 |
</div>
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
<a href="#"
|
| 101 |
class="external-link button is-normal is-rounded is-dark">
|
| 102 |
<span class="icon">
|
|
@@ -105,16 +108,16 @@
|
|
| 105 |
<span>arXiv</span>
|
| 106 |
</a>
|
| 107 |
</span>
|
| 108 |
-
|
| 109 |
-
|
| 110 |
<a href="https://huggingface.co/spaces/editing-images/ledtisplusplus"
|
| 111 |
target="_blank"
|
| 112 |
class="external-link button is-normal is-rounded is-dark">
|
| 113 |
<span>🤗 Demo</span>
|
| 114 |
</a>
|
| 115 |
</span>
|
| 116 |
-
|
| 117 |
-
|
| 118 |
<a href="https://huggingface.co/spaces/editing-images/ledtisplusplus/tree/main"
|
| 119 |
target="_blank"
|
| 120 |
class="external-link button is-normal is-rounded is-dark">
|
|
@@ -124,12 +127,12 @@
|
|
| 124 |
<span>Code</span>
|
| 125 |
</a>
|
| 126 |
</span>
|
| 127 |
-
|
| 128 |
-
|
|
|
|
|
|
|
| 129 |
</div>
|
| 130 |
-
|
| 131 |
-
</div>
|
| 132 |
-
</div>
|
| 133 |
</section>
|
| 134 |
|
| 135 |
<section class="hero teaser">
|
|
@@ -140,10 +143,6 @@
|
|
| 140 |
<source src="static/videos/faces.mp4"
|
| 141 |
type="video/mp4">
|
| 142 |
</video>
|
| 143 |
-
<video autoplay muted loop playsinline height="100%">
|
| 144 |
-
<source src="static/videos/objects_styles.mp4"
|
| 145 |
-
type="video/mp4">
|
| 146 |
-
</video>
|
| 147 |
|
| 148 |
|
| 149 |
<h2 class="subtitle has-text-centered">
|
|
@@ -193,10 +192,9 @@
|
|
| 193 |
</section>
|
| 194 |
|
| 195 |
|
| 196 |
-
|
| 197 |
<section class="section">
|
| 198 |
<div class="container is-max-desktop">
|
| 199 |
-
|
| 200 |
<div class="columns is-centered has-text-centered">
|
| 201 |
<h2 class="title is-3">LEDITS++: Efficient and Versatile Textual Image Editing</h2>
|
| 202 |
</div>
|
|
@@ -270,7 +268,9 @@
|
|
| 270 |
<p>
|
| 271 |
Utilizing T2I models for editing real images is usually done by inverting the sampling
|
| 272 |
process to identify a noisy xT that will be denoised to the input image x0.
|
| 273 |
-
We draw characteristics from <a href="https://inbarhub.github.io/DDPM_inversion/"
|
|
|
|
|
|
|
| 274 |
inversion method that greatly reduces the required number
|
| 275 |
of steps while maintaining no reconstruction error.
|
| 276 |
DDPM can be viewed as a first-order
|
|
@@ -283,67 +283,95 @@
|
|
| 283 |
<img src="static/images/inversion.png"/>
|
| 284 |
</div>
|
| 285 |
<div class="content">
|
| 286 |
-
|
| 287 |
-
|
| 288 |
-
|
| 289 |
-
|
| 290 |
-
|
| 291 |
-
|
| 292 |
-
|
| 293 |
-
|
| 294 |
-
|
| 295 |
-
|
| 296 |
-
|
| 297 |
-
|
| 298 |
-
|
| 299 |
<div class="content">
|
| 300 |
-
|
| 301 |
-
|
| 302 |
-
|
| 303 |
-
|
| 304 |
-
|
| 305 |
-
|
| 306 |
-
|
| 307 |
-
|
| 308 |
-
|
| 309 |
-
|
| 310 |
-
|
| 311 |
-
|
| 312 |
-
|
| 313 |
-
|
| 314 |
-
|
| 315 |
-
|
| 316 |
</div>
|
| 317 |
-
|
| 318 |
</div>
|
| 319 |
</div>
|
| 320 |
<div class="columns is-centered has-text-centered">
|
| 321 |
-
|
| 322 |
-
|
| 323 |
-
|
| 324 |
-
|
| 325 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 326 |
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 327 |
</div>
|
| 328 |
|
| 329 |
</section>
|
| 330 |
<section class="section">
|
| 331 |
<div class="container is-max-desktop">
|
| 332 |
-
|
| 333 |
-
|
| 334 |
-
|
| 335 |
-
|
| 336 |
-
|
| 337 |
-
|
| 338 |
-
|
| 339 |
-
|
| 340 |
-
|
| 341 |
|
| 342 |
</div>
|
| 343 |
</section>
|
| 344 |
-
|
| 345 |
-
|
| 346 |
-
|
| 347 |
<!--<section class="hero teaser">-->
|
| 348 |
<!-- <div class="container is-max-desktop">-->
|
| 349 |
<!-- <div class="hero-body">-->
|
|
@@ -359,15 +387,15 @@
|
|
| 359 |
<!-- </div>-->
|
| 360 |
<!--</section>-->
|
| 361 |
|
| 362 |
-
|
| 363 |
|
| 364 |
|
| 365 |
<section class="section" id="BibTeX">
|
| 366 |
-
|
| 367 |
-
|
| 368 |
-
|
| 369 |
}</code></pre>
|
| 370 |
-
|
| 371 |
</section>
|
| 372 |
|
| 373 |
|
|
|
|
| 27 |
<script src="./static/js/bulma-slider.min.js"></script>
|
| 28 |
<script src="./static/js/index.js"></script>
|
| 29 |
<style>
|
| 30 |
+
.publication-links a {
|
| 31 |
+
color: white !important
|
| 32 |
+
}
|
| 33 |
+
|
| 34 |
+
@media only screen and (max-width: 900px) {
|
| 35 |
+
.columns {
|
| 36 |
+
overflow-y: scroll;
|
| 37 |
+
}
|
| 38 |
+
}
|
| 39 |
+
|
| 40 |
+
@media only screen and (min-width: 901px) {
|
| 41 |
+
.is-centered img {
|
| 42 |
+
width: 80vw !important
|
| 43 |
+
}
|
| 44 |
+
}
|
| 45 |
</style>
|
| 46 |
</head>
|
| 47 |
<body>
|
|
|
|
| 58 |
|
| 59 |
|
| 60 |
<section class="hero">
|
| 61 |
+
<div class="hero-body">
|
| 62 |
+
<div class="container is-max-desktop">
|
| 63 |
+
<div class="columns is-centered">
|
| 64 |
+
<div class="column has-text-centered">
|
| 65 |
+
<h1 class="title is-1 publication-title">LEDITS++: Limitless Image Editing using Text-to-Image
|
| 66 |
+
Models</h1>
|
| 67 |
+
<div class="is-size-5 publication-authors">
|
| 68 |
<span class="author-block">
|
| 69 |
<a href="https://scholar.google.com/citations?user=kJ9Abf8AAAAJ&hl=en">Manuel Brack</a>¹²,
|
| 70 |
</span>
|
|
|
|
| 87 |
<a href="https://twitter.com/multimodalart">Apolinário Passos</a>⁴
|
| 88 |
</span>
|
| 89 |
<p></p>
|
| 90 |
+
|
| 91 |
<div class="is-size-5 publication-authors">
|
| 92 |
<span class="author-block">¹ German Research Center for Artificial Intelligence (DFKI),</span>
|
| 93 |
<span class="author-block">² Computer Science Department, TU Darmstadt,</span>
|
|
|
|
| 96 |
<span class="author-block">⁵ Centre for Cognitive Science, TU Darmstadt,</span>
|
| 97 |
<span class="author-block">⁶ LAION</span>
|
| 98 |
</div>
|
| 99 |
+
<div class="column has-text-centered">
|
| 100 |
+
<div class="publication-links">
|
| 101 |
+
<!-- arxiv Link. -->
|
| 102 |
+
<span class="link-block">
|
| 103 |
<a href="#"
|
| 104 |
class="external-link button is-normal is-rounded is-dark">
|
| 105 |
<span class="icon">
|
|
|
|
| 108 |
<span>arXiv</span>
|
| 109 |
</a>
|
| 110 |
</span>
|
| 111 |
+
<!-- Demo Link. -->
|
| 112 |
+
<span class="link-block">
|
| 113 |
<a href="https://huggingface.co/spaces/editing-images/ledtisplusplus"
|
| 114 |
target="_blank"
|
| 115 |
class="external-link button is-normal is-rounded is-dark">
|
| 116 |
<span>🤗 Demo</span>
|
| 117 |
</a>
|
| 118 |
</span>
|
| 119 |
+
<!-- Code Link. -->
|
| 120 |
+
<span class="link-block">
|
| 121 |
<a href="https://huggingface.co/spaces/editing-images/ledtisplusplus/tree/main"
|
| 122 |
target="_blank"
|
| 123 |
class="external-link button is-normal is-rounded is-dark">
|
|
|
|
| 127 |
<span>Code</span>
|
| 128 |
</a>
|
| 129 |
</span>
|
| 130 |
+
</div>
|
| 131 |
+
</div>
|
| 132 |
+
</div>
|
| 133 |
+
</div>
|
| 134 |
</div>
|
| 135 |
+
</div>
|
|
|
|
|
|
|
| 136 |
</section>
|
| 137 |
|
| 138 |
<section class="hero teaser">
|
|
|
|
| 143 |
<source src="static/videos/faces.mp4"
|
| 144 |
type="video/mp4">
|
| 145 |
</video>
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
|
| 147 |
|
| 148 |
<h2 class="subtitle has-text-centered">
|
|
|
|
| 192 |
</section>
|
| 193 |
|
| 194 |
|
|
|
|
| 195 |
<section class="section">
|
| 196 |
<div class="container is-max-desktop">
|
| 197 |
+
<!-- Introduction -->
|
| 198 |
<div class="columns is-centered has-text-centered">
|
| 199 |
<h2 class="title is-3">LEDITS++: Efficient and Versatile Textual Image Editing</h2>
|
| 200 |
</div>
|
|
|
|
| 268 |
<p>
|
| 269 |
Utilizing T2I models for editing real images is usually done by inverting the sampling
|
| 270 |
process to identify a noisy xT that will be denoised to the input image x0.
|
| 271 |
+
We draw characteristics from <a href="https://inbarhub.github.io/DDPM_inversion/"
|
| 272 |
+
target="_blank">edit friendly DDPM inversion</a> and propose
|
| 273 |
+
an efficient
|
| 274 |
inversion method that greatly reduces the required number
|
| 275 |
of steps while maintaining no reconstruction error.
|
| 276 |
DDPM can be viewed as a first-order
|
|
|
|
| 283 |
<img src="static/images/inversion.png"/>
|
| 284 |
</div>
|
| 285 |
<div class="content">
|
| 286 |
+
<h2 class="title is-4">Component 2: Textual Editing</h2>
|
| 287 |
+
<p>
|
| 288 |
+
After creating our re-construction sequence, we can edit the image by manipulating
|
| 289 |
+
the noise estimate εθ based on a set of edit instructions. We devise a dedicated
|
| 290 |
+
guidance term for each concept based on conditioned and unconditioned estimate. We
|
| 291 |
+
define LEDITS++ guidance such that it both reflects the direction of the edit (if we
|
| 292 |
+
want
|
| 293 |
+
to push away from/towards the edit concept) and maximizes fine-grained control over
|
| 294 |
+
the effect of the desired edit.
|
| 295 |
+
|
| 296 |
+
</p>
|
| 297 |
+
<img src="static/images/textual_editing.png"/>
|
| 298 |
+
</div>
|
| 299 |
<div class="content">
|
| 300 |
+
<h2 class="title is-4">Component 3: Semantic Grounding</h2>
|
| 301 |
+
<p>
|
| 302 |
+
In our defined LEDITS++ guidance, we include a masking term composed of the
|
| 303 |
+
intersection between the mask generated from
|
| 304 |
+
the U-Net’s cross-attention layers and a mask derived from
|
| 305 |
+
the noise estimate - yielding a mask both focused on relevant image
|
| 306 |
+
regions and of fine granularity.
|
| 307 |
+
We empirically demonstrate that these maps can also capture regions
|
| 308 |
+
of an image relevant to an editing concept that is not already present.
|
| 309 |
+
Specifically for multiple edits, calculating a
|
| 310 |
+
dedicated mask for each edit prompt ensures that the corresponding
|
| 311 |
+
guidance terms remain largely isolated, limiting
|
| 312 |
+
interference between them.
|
| 313 |
+
|
| 314 |
+
</p>
|
| 315 |
+
|
| 316 |
</div>
|
| 317 |
+
|
| 318 |
</div>
|
| 319 |
</div>
|
| 320 |
<div class="columns is-centered has-text-centered">
|
| 321 |
+
<img
|
| 322 |
+
style="max-height:800px; max-width:800px"
|
| 323 |
+
src="static/images/semantic_grounding.png"
|
| 324 |
+
/>
|
| 325 |
+
</div>
|
| 326 |
+
|
| 327 |
+
<div class="columns is-centered has-text-centered">
|
| 328 |
+
<h2 class="title is-3">Properties of LEDITS++
|
| 329 |
+
</h2>
|
| 330 |
+
</div>
|
| 331 |
+
<div class="columns is-centered has-text-centered">
|
| 332 |
+
<div class="column">
|
| 333 |
+
<p>
|
| 334 |
+
Efficiency.
|
| 335 |
+
</p>
|
| 336 |
+
</div>
|
| 337 |
+
<div class="column">
|
| 338 |
+
<p>
|
| 339 |
+
Versatility.
|
| 340 |
+
</p>
|
| 341 |
+
</div>
|
| 342 |
+
<div class="column">
|
| 343 |
+
<p>
|
| 344 |
+
Precision.
|
| 345 |
+
</p>
|
| 346 |
+
</div>
|
| 347 |
+
</div>
|
| 348 |
+
|
| 349 |
</div>
|
| 350 |
+
<video autoplay muted loop playsinline height="100%">
|
| 351 |
+
<source src="static/videos/objects_styles.mp4"
|
| 352 |
+
type="video/mp4">
|
| 353 |
+
</video>
|
| 354 |
+
|
| 355 |
</div>
|
| 356 |
|
| 357 |
</section>
|
| 358 |
<section class="section">
|
| 359 |
<div class="container is-max-desktop">
|
| 360 |
+
<div class="columns is-centered has-text-centered">
|
| 361 |
+
<h2 class="title is-3">Interactive Demo</h2>
|
| 362 |
+
</div>
|
| 363 |
+
<script
|
| 364 |
+
type="module"
|
| 365 |
+
src="https://gradio.s3-us-west-2.amazonaws.com/3.43.0/gradio.js"
|
| 366 |
+
></script>
|
| 367 |
+
|
| 368 |
+
<gradio-app src="https://editing-images-ledtisplusplus.hf.space"></gradio-app>
|
| 369 |
|
| 370 |
</div>
|
| 371 |
</section>
|
| 372 |
+
|
| 373 |
+
|
| 374 |
+
<!-- portraits video -->
|
| 375 |
<!--<section class="hero teaser">-->
|
| 376 |
<!-- <div class="container is-max-desktop">-->
|
| 377 |
<!-- <div class="hero-body">-->
|
|
|
|
| 387 |
<!-- </div>-->
|
| 388 |
<!--</section>-->
|
| 389 |
|
| 390 |
+
<!-- 3 key observations -->
|
| 391 |
|
| 392 |
|
| 393 |
<section class="section" id="BibTeX">
|
| 394 |
+
<div class="container is-max-desktop content">
|
| 395 |
+
<h2 class="title">BibTeX</h2>
|
| 396 |
+
<pre><code>@article{
|
| 397 |
}</code></pre>
|
| 398 |
+
</div>
|
| 399 |
</section>
|
| 400 |
|
| 401 |
|