Spaces:

prithivMLmods
/

DocScope-R1

Running on Zero

App Files Files Community

prithivMLmods committed on Apr 21

Commit

03b41ea

verified ·

1 Parent(s): ce44242

Update app.py

Browse files

Files changed (1) hide show

app.py +215 -193

app.py CHANGED Viewed

@@ -3,7 +3,8 @@ import spaces
 import torch
 from diffusers import AutoencoderKL, TCDScheduler
 from diffusers.models.model_loading_utils import load_state_dict
-# Removed: from gradio_imageslider import ImageSlider
 from huggingface_hub import hf_hub_download
 from controlnet_union import ControlNetModel_Union
@@ -12,7 +13,7 @@ from pipeline_fill_sd_xl import StableDiffusionXLFillPipeline
 from PIL import Image, ImageDraw
 import numpy as np
-# --- Model Loading (unchanged) ---
 config_file = hf_hub_download(
     "xinsir/controlnet-union-sdxl-1.0",
     filename="config_promax.json",
@@ -46,8 +47,7 @@ pipe = StableDiffusionXLFillPipeline.from_pretrained(
 pipe.scheduler = TCDScheduler.from_config(pipe.scheduler.config)
-# --- Helper Functions (unchanged, except infer) ---
 def can_expand(source_width, source_height, target_width, target_height, alignment):
     """Checks if the image can be expanded based on the alignment."""
     if alignment in ("Left", "Right") and source_width >= target_width:
@@ -129,28 +129,39 @@ def prepare_image_and_mask(image, width, height, overlap_percentage, resize_opti
     mask_draw = ImageDraw.Draw(mask)
     # Calculate overlap areas
-    white_gaps_patch = 2
     left_overlap = margin_x + overlap_x if overlap_left else margin_x + white_gaps_patch
     right_overlap = margin_x + new_width - overlap_x if overlap_right else margin_x + new_width - white_gaps_patch
     top_overlap = margin_y + overlap_y if overlap_top else margin_y + white_gaps_patch
     bottom_overlap = margin_y + new_height - overlap_y if overlap_bottom else margin_y + new_height - white_gaps_patch
     if alignment == "Left":
-        left_overlap = margin_x + overlap_x if overlap_left else margin_x
     elif alignment == "Right":
-        right_overlap = margin_x + new_width - overlap_x if overlap_right else margin_x + new_width
     elif alignment == "Top":
-        top_overlap = margin_y + overlap_y if overlap_top else margin_y
     elif alignment == "Bottom":
-        bottom_overlap = margin_y + new_height - overlap_y if overlap_bottom else margin_y + new_height
-    # Draw the mask
-    mask_draw.rectangle([
-        (left_overlap, top_overlap),
-        (right_overlap, bottom_overlap)
-    ], fill=0)
     return background, mask
@@ -160,15 +171,11 @@ def preview_image_and_mask(image, width, height, overlap_percentage, resize_opti
     # Create a preview image showing the mask
     preview = background.copy().convert('RGBA')
-    # Create a semi-transparent red overlay
-    red_overlay = Image.new('RGBA', background.size, (255, 0, 0, 64))  # Reduced alpha to 64 (25% opacity)
-    # Convert black pixels in the mask to semi-transparent red
-    red_mask = Image.new('RGBA', background.size, (0, 0, 0, 0))
-    red_mask.paste(red_overlay, (0, 0), mask)
-    # Overlay the red mask on the background
-    preview = Image.alpha_composite(preview, red_mask)
     return preview
@@ -176,22 +183,29 @@ def preview_image_and_mask(image, width, height, overlap_percentage, resize_opti
 def infer(image, width, height, overlap_percentage, num_inference_steps, resize_option, custom_resize_percentage, prompt_input, alignment, overlap_left, overlap_right, overlap_top, overlap_bottom):
     background, mask = prepare_image_and_mask(image, width, height, overlap_percentage, resize_option, custom_resize_percentage, alignment, overlap_left, overlap_right, overlap_top, overlap_bottom)
-    if not can_expand(background.width, background.height, width, height, alignment):
-        alignment = "Middle" # Default to middle if expansion not possible with current alignment
     cnet_image = background.copy()
-    # Prepare the controlnet input image (original image with blacked-out mask area)
-    # Note: The pipeline expects the original image content where the mask is 0 (black)
-    # and the area to be filled where the mask is 255 (white).
-    # However, the current pipeline_fill_sd_xl seems to use the mask differently internally.
-    # Let's prepare the input image as per the original logic, which pastes black over the masked area.
-    black_fill = Image.new('RGB', cnet_image.size, (0, 0, 0))
-    # Invert the mask: white (255) becomes the area to keep, black (0) the area to fill
-    inverted_mask = Image.eval(mask, lambda x: 255 - x)
-    cnet_image.paste(black_fill, (0, 0), inverted_mask) # Paste black where the inverted mask is white (original mask was 0)
-    final_prompt = f"{prompt_input} , high quality, 4k"
     (
         prompt_embeds,
@@ -200,62 +214,57 @@ def infer(image, width, height, overlap_percentage, num_inference_steps, resize_
         negative_pooled_prompt_embeds,
     ) = pipe.encode_prompt(final_prompt, "cuda", True)
-    # Generate the image content for the masked area
-    # The pipeline yields the generated content for the masked area
-    # We only need the final result from the generator
-    generated_content = None
-    for res in pipe(
         prompt_embeds=prompt_embeds,
         negative_prompt_embeds=negative_prompt_embeds,
         pooled_prompt_embeds=pooled_prompt_embeds,
         negative_pooled_prompt_embeds=negative_pooled_prompt_embeds,
-        image=cnet_image, # Pass the image with blacked-out area
-        mask_image=mask, # Pass the mask (white = area to fill)
-        num_inference_steps=num_inference_steps
-    ):
-        generated_content = res # Keep updating until the last step
-    # The pipeline directly returns the final composite image in recent versions
-    # If it returns only the filled part, we need to composite it
-    # Let's assume the pipeline returns the final composited image based on its name "FillPipeline"
-    final_image = generated_content
-    # --- OLD compositing logic (keep commented in case pipeline behavior differs) ---
-    # # Convert generated content to RGBA to handle potential transparency
-    # generated_content = generated_content.convert("RGBA")
-    # # Create the final composite image by pasting the generated content onto the background
-    # final_image = background.copy().convert("RGBA")
-    # # Paste the generated content using the original mask (white area = where to paste)
-    # final_image.paste(generated_content, (0, 0), mask)
-    # final_image = final_image.convert("RGB") # Convert back to RGB if needed
-    # Yield only the final composited image
-    yield final_image
 def clear_result():
-    """Clears the result Image."""
     return gr.update(value=None)
 def preload_presets(target_ratio, ui_width, ui_height):
     """Updates the width and height sliders based on the selected aspect ratio."""
     if target_ratio == "9:16":
         changed_width = 720
         changed_height = 1280
-        return changed_width, changed_height, gr.update()
     elif target_ratio == "16:9":
         changed_width = 1280
         changed_height = 720
-        return changed_width, changed_height, gr.update()
     elif target_ratio == "1:1":
         changed_width = 1024
         changed_height = 1024
-        return changed_width, changed_height, gr.update()
     elif target_ratio == "Custom":
-        # When switching to custom, keep current slider values but open the accordion
         return ui_width, ui_height, gr.update(open=True)
 def select_the_right_preset(user_width, user_height):
     if user_width == 720 and user_height == 1280:
         return "9:16"
     elif user_width == 1280 and user_height == 720:
@@ -266,53 +275,65 @@ def select_the_right_preset(user_width, user_height):
         return "Custom"
 def toggle_custom_resize_slider(resize_option):
     return gr.update(visible=(resize_option == "Custom"))
 def update_history(new_image, history):
     """Updates the history gallery with the new image."""
     if history is None:
         history = []
-    # Ensure new_image is a PIL Image before inserting
     if isinstance(new_image, Image.Image):
         history.insert(0, new_image)
-    # Handle cases where the input might be None or not an image (e.g., during clearing)
-    elif new_image is not None:
-        print(f"Warning: Attempted to add non-image type to history: {type(new_image)}")
     return history
-# --- Gradio UI ---
 css = """
 .gradio-container {
     width: 1200px !important;
 }
 h1 { text-align: center; }
 footer { visibility: hidden; }
-"""
-title = """<h1 align="center">Diffusers Image Outpaint Lightning</h1>
 """
 with gr.Blocks(css=css) as demo:
     with gr.Column():
         gr.HTML(title)
         with gr.Row():
-            with gr.Column():
                 input_image = gr.Image(
                     type="pil",
-                    label="Input Image"
                 )
                 with gr.Row():
                     with gr.Column(scale=2):
-                        prompt_input = gr.Textbox(label="Prompt (Optional)")
                     with gr.Column(scale=1):
-                        run_button = gr.Button("Generate")
                 with gr.Row():
                     target_ratio = gr.Radio(
-                        label="Expected Ratio",
                         choices=["9:16", "16:9", "1:1", "Custom"],
                         value="9:16",
                         scale=2
@@ -321,130 +342,123 @@ with gr.Blocks(css=css) as demo:
                     alignment_dropdown = gr.Dropdown(
                         choices=["Middle", "Left", "Right", "Top", "Bottom"],
                         value="Middle",
-                        label="Alignment"
                     )
                 with gr.Accordion(label="Advanced settings", open=False) as settings_panel:
-                    with gr.Column():
-                        with gr.Row():
-                            width_slider = gr.Slider(
-                                label="Target Width",
-                                minimum=720,
-                                maximum=1536,
-                                step=8,
-                                value=720,  # Default for 9:16
-                            )
-                            height_slider = gr.Slider(
-                                label="Target Height",
-                                minimum=720,
-                                maximum=1536,
-                                step=8,
-                                value=1280, # Default for 9:16
-                            )
-                        num_inference_steps = gr.Slider(label="Steps", minimum=4, maximum=12, step=1, value=8)
-                        with gr.Group():
-                            overlap_percentage = gr.Slider(
-                                label="Mask overlap (%)",
-                                minimum=1,
-                                maximum=50,
-                                value=10,
-                                step=1
-                            )
-                            with gr.Row():
-                                overlap_top = gr.Checkbox(label="Overlap Top", value=True)
-                                overlap_right = gr.Checkbox(label="Overlap Right", value=True)
-                            with gr.Row(): # Changed nesting for better layout
-                                overlap_left = gr.Checkbox(label="Overlap Left", value=True)
-                                overlap_bottom = gr.Checkbox(label="Overlap Bottom", value=True)
                         with gr.Row():
-                            resize_option = gr.Radio(
-                                label="Resize input image",
-                                choices=["Full", "50%", "33%", "25%", "Custom"],
-                                value="Full"
-                            )
-                            custom_resize_percentage = gr.Slider(
-                                label="Custom resize (%)",
-                                minimum=1,
-                                maximum=100,
-                                step=1,
-                                value=50,
-                                visible=False
-                            )
-                        with gr.Column(): # Keep preview button separate
-                            preview_button = gr.Button("Preview alignment and mask")
                 gr.Examples(
                     examples=[
-                        ["./examples/example_1.webp", 1280, 720, "Middle"],
-                        ["./examples/example_2.jpg", 1440, 810, "Left"],
-                        ["./examples/example_3.jpg", 1024, 1024, "Top"],
-                        ["./examples/example_3.jpg", 1024, 1024, "Bottom"],
                     ],
-                    inputs=[input_image, width_slider, height_slider, alignment_dropdown],
-                     # Ensure examples don't try to set output components directly
-                     # outputs=[result], # Remove output mapping from examples
-                     # fn=infer, # Don't run infer on example click, just load inputs
                 )
-            with gr.Column():
-                # *** MODIFICATION: Changed ImageSlider to Image ***
-                result = gr.Image(label="Generated Image", interactive=False, type="pil")
-                use_as_input_button = gr.Button("Use as Input Image", visible=False)
-                history_gallery = gr.Gallery(label="History", columns=6, object_fit="contain", interactive=False, type="pil")
-                preview_image = gr.Image(label="Preview", type="pil") # Ensure preview is also PIL
-    # --- Event Handlers ---
     def use_output_as_input(output_image):
         """Sets the generated output as the new input image."""
-        # *** MODIFICATION: Access the image directly, not output_image[1] ***
         return gr.update(value=output_image)
     use_as_input_button.click(
         fn=use_output_as_input,
-        inputs=[result], # Input is the single result image
-        outputs=[input_image]
     )
     target_ratio.change(
         fn=preload_presets,
         inputs=[target_ratio, width_slider, height_slider],
-        outputs=[width_slider, height_slider, settings_panel],
         queue=False
     )
-    # Link sliders change to update the ratio selection to "Custom"
     width_slider.change(
         fn=select_the_right_preset,
         inputs=[width_slider, height_slider],
         outputs=[target_ratio],
         queue=False
-    ).then(
-        fn=lambda: gr.update(open=True), # Also open accordion on slider change
-        inputs=None,
-        outputs=settings_panel,
-        queue=False
     )
     height_slider.change(
         fn=select_the_right_preset,
         inputs=[width_slider, height_slider],
         outputs=[target_ratio],
         queue=False
-    ).then(
-        fn=lambda: gr.update(open=True), # Also open accordion on slider change
-        inputs=None,
-        outputs=settings_panel,
-        queue=False
     )
     resize_option.change(
         fn=toggle_custom_resize_slider,
         inputs=[resize_option],
@@ -452,49 +466,58 @@ with gr.Blocks(css=css) as demo:
         queue=False
     )
-    # Combine run logic for Button and Textbox submission
-    run_inputs = [
         input_image, width_slider, height_slider, overlap_percentage, num_inference_steps,
         resize_option, custom_resize_percentage, prompt_input, alignment_dropdown,
         overlap_left, overlap_right, overlap_top, overlap_bottom
     ]
-    def run_generation(img, w, h, ov_perc, steps, res_opt, cust_res_perc, prompt, align, ov_l, ov_r, ov_t, ov_b, history):
-        # The infer function is a generator, we need to iterate to get the final value
-        final_image = None
-        for res_img in infer(img, w, h, ov_perc, steps, res_opt, cust_res_perc, prompt, align, ov_l, ov_r, ov_t, ov_b):
-            final_image = res_img
-        # Update history with the final image
-        updated_history = update_history(final_image, history)
-        # Return the final image for the result component and the updated history
-        return final_image, updated_history, gr.update(visible=True) # Also make button visible
     run_button.click(
-        fn=clear_result, # First clear the previous result
         inputs=None,
-        outputs=result,
-        queue=False # Clearing should be fast
     ).then(
-        fn=run_generation, # Then run the generation and history update
-        inputs=run_inputs + [history_gallery], # Pass current history
-        outputs=[result, history_gallery, use_as_input_button], # Update result, history, and button visibility
     )
     prompt_input.submit(
-        fn=clear_result, # First clear the previous result
         inputs=None,
-        outputs=result,
-        queue=False # Clearing should be fast
     ).then(
-        fn=run_generation, # Then run the generation and history update
-        inputs=run_inputs + [history_gallery], # Pass current history
-        outputs=[result, history_gallery, use_as_input_button], # Update result, history, and button visibility
     )
     preview_button.click(
         fn=preview_image_and_mask,
         inputs=[input_image, width_slider, height_slider, overlap_percentage, resize_option, custom_resize_percentage, alignment_dropdown,
@@ -503,5 +526,4 @@ with gr.Blocks(css=css) as demo:
         queue=False # Preview should be fast
     )
-# Launch the demo
-demo.queue(max_size=20).launch(share=False, ssr_mode=False, show_error=True)

 import torch
 from diffusers import AutoencoderKL, TCDScheduler
 from diffusers.models.model_loading_utils import load_state_dict
+# Remove ImageSlider import
+# from gradio_imageslider import ImageSlider
 from huggingface_hub import hf_hub_download
 from controlnet_union import ControlNetModel_Union
 from PIL import Image, ImageDraw
 import numpy as np
+# --- Model Loading (Unchanged) ---
 config_file = hf_hub_download(
     "xinsir/controlnet-union-sdxl-1.0",
     filename="config_promax.json",
 pipe.scheduler = TCDScheduler.from_config(pipe.scheduler.config)
+# --- Helper Functions (Mostly Unchanged) ---
 def can_expand(source_width, source_height, target_width, target_height, alignment):
     """Checks if the image can be expanded based on the alignment."""
     if alignment in ("Left", "Right") and source_width >= target_width:
     mask_draw = ImageDraw.Draw(mask)
     # Calculate overlap areas
+    white_gaps_patch = 2 # Pixels to leave unmasked at edges if overlap is disabled for that edge
     left_overlap = margin_x + overlap_x if overlap_left else margin_x + white_gaps_patch
     right_overlap = margin_x + new_width - overlap_x if overlap_right else margin_x + new_width - white_gaps_patch
     top_overlap = margin_y + overlap_y if overlap_top else margin_y + white_gaps_patch
     bottom_overlap = margin_y + new_height - overlap_y if overlap_bottom else margin_y + new_height - white_gaps_patch
+    # Adjust overlap boundaries based on alignment when specific overlap directions are *disabled*
+    # This prevents unmasking the absolute edge of the canvas in alignment modes
     if alignment == "Left":
+        left_overlap = margin_x + overlap_x if overlap_left else margin_x # Keep edge masked if alignment is left
     elif alignment == "Right":
+        right_overlap = margin_x + new_width - overlap_x if overlap_right else margin_x + new_width # Keep edge masked
     elif alignment == "Top":
+        top_overlap = margin_y + overlap_y if overlap_top else margin_y # Keep edge masked
     elif alignment == "Bottom":
+        bottom_overlap = margin_y + new_height - overlap_y if overlap_bottom else margin_y + new_height # Keep edge masked
+    # Ensure coordinates are within bounds
+    left_overlap = max(0, left_overlap)
+    top_overlap = max(0, top_overlap)
+    right_overlap = min(target_size[0], right_overlap)
+    bottom_overlap = min(target_size[1], bottom_overlap)
+    # Draw the mask (black rectangle for the area to keep)
+    if right_overlap > left_overlap and bottom_overlap > top_overlap:
+        mask_draw.rectangle([
+            (left_overlap, top_overlap),
+            (right_overlap, bottom_overlap)
+        ], fill=0) # 0 means keep this area (not masked for inpainting)
+    # Invert the mask: White areas (255) will be inpainted. Black (0) is kept.
+    mask = Image.fromarray(255 - np.array(mask))
     return background, mask
     # Create a preview image showing the mask
     preview = background.copy().convert('RGBA')
+    # Create a semi-transparent red overlay for the masked (inpainting) area
+    red_overlay = Image.new('RGBA', background.size, (255, 0, 0, 100)) # 100 alpha (~40% opacity)
+    # The mask is now white (255) where inpainting happens. Use this directly.
+    preview.paste(red_overlay, (0, 0), mask)
     return preview
 def infer(image, width, height, overlap_percentage, num_inference_steps, resize_option, custom_resize_percentage, prompt_input, alignment, overlap_left, overlap_right, overlap_top, overlap_bottom):
     background, mask = prepare_image_and_mask(image, width, height, overlap_percentage, resize_option, custom_resize_percentage, alignment, overlap_left, overlap_right, overlap_top, overlap_bottom)
+    # Ensure alignment allows expansion, default to Middle if not
+    source_w, source_h = background.size # Use background size after initial resize/placement
+    target_w, target_h = width, height
+    if alignment in ("Left", "Right") and source_w >= target_w:
+        print(f"Warning: Source width ({source_w}) >= target width ({target_w}) with {alignment} alignment. Forcing Middle alignment.")
+        alignment = "Middle"
+        # NOTE: background and mask were already built above using the original alignment, so reassigning alignment here does not change them unless they are rebuilt.
+        # background, mask = prepare_image_and_mask(...) # Rebuild here if the corrected alignment should take effect
+    if alignment in ("Top", "Bottom") and source_h >= target_h:
+        print(f"Warning: Source height ({source_h}) >= target height ({target_h}) with {alignment} alignment. Forcing Middle alignment.")
+        alignment = "Middle"
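+        # NOTE: background and mask were already built above using the original alignment, so reassigning alignment here does not change them unless they are rebuilt.
+        # background, mask = prepare_image_and_mask(...) # Rebuild here if the corrected alignment should take effect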
+    # Image for ControlNet input (masked original content)
+    # The pipeline expects the original image content in the non-masked area
     cnet_image = background.copy()
+    # The pipeline's `image` argument is the *initial* content for the *masked* area (often noise, but here we provide the background)
+    # The `mask_image` tells the pipeline *where* to perform the inpainting/outpainting.
+    # The controlnet `image` needs the original content visible in the non-masked area.
+    # ControlNet Union seems to work well by just passing the background with the source image pasted.
+    final_prompt = f"{prompt_input} , high quality, 4k" if prompt_input else "high quality, 4k"
     (
         prompt_embeds,
         negative_pooled_prompt_embeds,
     ) = pipe.encode_prompt(final_prompt, "cuda", True)
+    # The pipeline call
+    # Note: The pipeline expects `image` (initial state for masked area) and `mask_image`
+    # The `control_image` is implicitly handled by the ControlNet attached to the pipeline
+    output_image = pipe(
         prompt_embeds=prompt_embeds,
         negative_prompt_embeds=negative_prompt_embeds,
         pooled_prompt_embeds=pooled_prompt_embeds,
         negative_pooled_prompt_embeds=negative_pooled_prompt_embeds,
+        image=background, # Provide the initial canvas state
+        mask_image=mask,   # Provide the mask (white is area to change)
+        control_image=cnet_image, # Pass the control image explicitly if needed by pipeline logic
+        num_inference_steps=num_inference_steps,
+        output_type="pil" # Ensure PIL output
+    ).images[0]
+    # The pipeline should have already handled the compositing based on the mask
+    # If not, uncomment the paste operation below:
+    # final_image = background.copy().convert("RGBA") # Start with original background
+    # output_image = output_image.convert("RGBA")
+    # mask_rgba = mask.convert('L').point(lambda p: 255 if p > 128 else 0) # Ensure mask is binary 0/255
+    # final_image.paste(output_image, (0, 0), mask_rgba) # Paste generated content using the mask
+    # Return the single final image
+    return output_image
 def clear_result():
+    """Clears the result Image component."""
     return gr.update(value=None)
+# --- UI Helper Functions (Unchanged) ---
 def preload_presets(target_ratio, ui_width, ui_height):
     """Updates the width and height sliders based on the selected aspect ratio."""
     if target_ratio == "9:16":
         changed_width = 720
         changed_height = 1280
+        return changed_width, changed_height, gr.update() # No-arg update: accordion state is left as-is (open=False is not passed)
     elif target_ratio == "16:9":
         changed_width = 1280
         changed_height = 720
+        return changed_width, changed_height, gr.update() # No-arg update: accordion state is left as-is (open=False is not passed)
     elif target_ratio == "1:1":
         changed_width = 1024
         changed_height = 1024
+        return changed_width, changed_height, gr.update() # No-arg update: accordion state is left as-is (open=False is not passed)
     elif target_ratio == "Custom":
+        # Don't change sliders, just open accordion
         return ui_width, ui_height, gr.update(open=True)
 def select_the_right_preset(user_width, user_height):
+    """Updates the radio button based on the current slider values."""
     if user_width == 720 and user_height == 1280:
         return "9:16"
     elif user_width == 1280 and user_height == 720:
         return "Custom"
 def toggle_custom_resize_slider(resize_option):
+    """Shows/hides the custom resize slider."""
     return gr.update(visible=(resize_option == "Custom"))
 def update_history(new_image, history):
     """Updates the history gallery with the new image."""
     if history is None:
         history = []
+    # Ensure new_image is a PIL Image before adding
     if isinstance(new_image, Image.Image):
         history.insert(0, new_image)
     return history
+# --- Gradio UI Definition ---
 css = """
 .gradio-container {
     width: 1200px !important;
+    margin: auto !important; /* Center the container */
 }
 h1 { text-align: center; }
 footer { visibility: hidden; }
+/* Ensure result image takes reasonable space */
+#result-image img {
+    max-height: 768px; /* Adjust max height as needed */
+    object-fit: contain;
+    width: auto;
+    height: auto;
+}
+#history-gallery .thumbnail-item { /* Style history items */
+    height: 100px !important;
+}
+#history-gallery .gallery {
+    grid-template-rows: repeat(auto-fill, 100px) !important;
+}
 """
+title = """<h1 align="center">Diffusers Image Outpaint Lightning</h1>"""
 with gr.Blocks(css=css) as demo:
     with gr.Column():
         gr.HTML(title)
         with gr.Row():
+            with gr.Column(scale=1): # Left column for inputs
                 input_image = gr.Image(
                     type="pil",
+                    label="Input Image",
+                    height=400 # Give input image reasonable height
                 )
                 with gr.Row():
                     with gr.Column(scale=2):
+                        prompt_input = gr.Textbox(label="Prompt (Optional)", placeholder="Describe the scene to expand...")
                     with gr.Column(scale=1):
+                        run_button = gr.Button("Generate", variant="primary") # Make primary
                 with gr.Row():
                     target_ratio = gr.Radio(
+                        label="Target Ratio",
                         choices=["9:16", "16:9", "1:1", "Custom"],
                         value="9:16",
                         scale=2
                     alignment_dropdown = gr.Dropdown(
                         choices=["Middle", "Left", "Right", "Top", "Bottom"],
                         value="Middle",
+                        label="Align Source Image"
                     )
                 with gr.Accordion(label="Advanced settings", open=False) as settings_panel:
+                    with gr.Row():
+                         width_slider = gr.Slider(
+                             label="Target Width",
+                             minimum=512, # Lowered minimum slightly
+                             maximum=2048, # Increased maximum slightly
+                             step=64, # Use steps of 64 common for SD
+                             value=720,
+                         )
+                         height_slider = gr.Slider(
+                             label="Target Height",
+                             minimum=512,
+                             maximum=2048,
+                             step=64,
+                             value=1280,
+                         )
+                    num_inference_steps = gr.Slider(label="Steps", minimum=1, maximum=12, step=1, value=4) # TCD/Lightning allows few steps
+                    with gr.Group():
+                        overlap_percentage = gr.Slider(
+                            label="Mask overlap (%)",
+                            minimum=1,
+                            maximum=50,
+                            value=12, # Default overlap
+                            step=1
+                        )
                         with gr.Row():
+                            overlap_top = gr.Checkbox(label="Top", value=True)
+                            overlap_right = gr.Checkbox(label="Right", value=True)
+                            overlap_bottom = gr.Checkbox(label="Bottom", value=True)
+                            overlap_left = gr.Checkbox(label="Left", value=True)
+                    with gr.Row():
+                        resize_option = gr.Radio(
+                            label="Resize input within target",
+                            choices=["Full", "50%", "33%", "25%", "Custom"],
+                            value="Full"
+                        )
+                        custom_resize_percentage = gr.Slider(
+                            label="Custom resize (%)",
+                            minimum=1,
+                            maximum=100,
+                            step=1,
+                            value=50,
+                            visible=False # Initially hidden
+                        )
+                    preview_button = gr.Button("Preview Mask & Alignment")
+                    preview_image = gr.Image(label="Mask Preview (Red = Outpaint Area)", type="pil", interactive=False)
                 gr.Examples(
                     examples=[
+                        ["./examples/example_1.webp", "A wide landscape view of the mountains", 1280, 720, "Middle"],
+                        ["./examples/example_2.jpg", "Full body shot of the astronaut on the moon", 720, 1280, "Middle"],
+                        ["./examples/example_3.jpg", "Expanding the sky and ground around the subject", 1024, 1024, "Middle"],
+                         ["./examples/example_3.jpg", "Expanding downwards from the subject", 1024, 1024, "Top"], # Align subject Top
+                         ["./examples/example_3.jpg", "Expanding upwards from the subject", 1024, 1024, "Bottom"], # Align subject Bottom
                     ],
+                    inputs=[input_image, prompt_input, width_slider, height_slider, alignment_dropdown],
+                    label="Examples (Click to load)"
                 )
+            with gr.Column(scale=1): # Right column for output
+                # Replace ImageSlider with gr.Image
+                result = gr.Image(label="Generated Image", type="pil", interactive=False, elem_id="result-image")
+                use_as_input_button = gr.Button("Use Result as Input Image", visible=False) # Initially hidden
+                history_gallery = gr.Gallery(
+                    label="History",
+                    columns=6,
+                    object_fit="contain",
+                    interactive=False,
+                    height=110, # Fixed height for the row
+                    elem_id="history-gallery"
+                )
+    # --- Event Handling ---
     def use_output_as_input(output_image):
         """Sets the generated output as the new input image."""
+        # output_image is now the single final image from gr.Image
         return gr.update(value=output_image)
     use_as_input_button.click(
         fn=use_output_as_input,
+        inputs=[result], # Input is the result image component
+        outputs=[input_image] # Output updates the input image component
     )
     target_ratio.change(
         fn=preload_presets,
         inputs=[target_ratio, width_slider, height_slider],
+        outputs=[width_slider, height_slider, settings_panel], # Also control accordion state
         queue=False
     )
+    # Link sliders back to the ratio selector
     width_slider.change(
         fn=select_the_right_preset,
         inputs=[width_slider, height_slider],
         outputs=[target_ratio],
         queue=False
     )
     height_slider.change(
         fn=select_the_right_preset,
         inputs=[width_slider, height_slider],
         outputs=[target_ratio],
         queue=False
     )
     resize_option.change(
         fn=toggle_custom_resize_slider,
         inputs=[resize_option],
         queue=False
     )
+    # Consolidate common inputs for generation
+    gen_inputs = [
         input_image, width_slider, height_slider, overlap_percentage, num_inference_steps,
         resize_option, custom_resize_percentage, prompt_input, alignment_dropdown,
         overlap_left, overlap_right, overlap_top, overlap_bottom
     ]
+    # Chain generation logic
     run_button.click(
+        fn=clear_result,
         inputs=None,
+        outputs=[result], # Clear the single image output
+        queue=False # Run clearing immediately
     ).then(
+        fn=infer,
+        inputs=gen_inputs,
+        outputs=[result], # Output the single image to the result component
+    ).then(
+        # Update history with the single result image
+        fn=lambda res_img, hist: update_history(res_img, hist),
+        inputs=[result, history_gallery],
+        outputs=[history_gallery],
+        queue=False # Update history immediately after generation
+    ).then(
+        # Show the 'Use as Input' button
+        fn=lambda: gr.update(visible=True),
+        inputs=None,
+        outputs=[use_as_input_button],
+        queue=False # Show button immediately
     )
     prompt_input.submit(
+         fn=clear_result,
         inputs=None,
+        outputs=[result],
+        queue=False
+    ).then(
+        fn=infer,
+        inputs=gen_inputs,
+        outputs=[result],
     ).then(
+        fn=lambda res_img, hist: update_history(res_img, hist),
+        inputs=[result, history_gallery],
+        outputs=[history_gallery],
+         queue=False
+    ).then(
+        fn=lambda: gr.update(visible=True),
+        inputs=None,
+        outputs=[use_as_input_button],
+        queue=False
     )
     preview_button.click(
         fn=preview_image_and_mask,
         inputs=[input_image, width_slider, height_slider, overlap_percentage, resize_option, custom_resize_percentage, alignment_dropdown,
         queue=False # Preview should be fast
     )
+demo.queue(max_size=10).launch(ssr_mode=False, show_error=True) # Removed share=False for potential Hugging Face Spaces use