Spaces:

linoyts
/

Qwen-Image-Edit-next-scene

Running on Zero

App Files Files Community

linoyts HF Staff commited on 25 days ago

Commit

63c5b22

verified ·

1 Parent(s): 695bf10

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -13

app.py CHANGED Viewed

@@ -24,32 +24,54 @@ import time  # Added for history update delay
 from gradio_client import Client, handle_file
 import tempfile
-def turn_into_video(input_images, output_images, prompt):
     """Calls multimodalart/wan-2-2-first-last-frame space to generate a video."""
     if not input_images or not output_images:
-        raise gr.Error("Please generate at least one result first.")
-    # Take the first input and first output frame
-    start_img = input_images[0][0] if isinstance(input_images[0], tuple) else input_images[0]
-    end_img = output_images[0]
-    # Save them temporarily
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_start, \
          tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_end:
         start_img.save(tmp_start.name)
         end_img.save(tmp_end.name)
-        client = Client("multimodalart/wan-2-2-first-last-frame")
-        # Run inference on the remote space
         result = client.predict(
             start_image_pil={"image": handle_file(tmp_start.name)},
             end_image_pil={"image": handle_file(tmp_end.name)},
-            prompt=prompt or "generate smooth cinematic transition",
-            api_name="/generate_video"  # must match the remote Space’s API function name
         )
-    return result, gr.update(visible=True)
 SYSTEM_PROMPT = '''
@@ -650,9 +672,13 @@ with gr.Blocks(css=css) as demo:
     input_images.change(fn=suggest_next_scene_prompt, inputs=[input_images], outputs=[prompt])
     turn_video_btn.click(
-    fn=turn_into_video,
     inputs=[input_images, result, prompt],
-    outputs=[output_video, output_video],
 )

 from gradio_client import Client, handle_file
 import tempfile
+from PIL import Image
+import os
+import gradio as gr
+def turn_into_video(input_images, output_images, prompt, progress=gr.Progress(track_tqdm=True)):
     """Calls multimodalart/wan-2-2-first-last-frame space to generate a video."""
     if not input_images or not output_images:
+        raise gr.Error("Please generate an output image first.")
+    progress(0.02, desc="Preparing images...")
+    # Safely extract PIL images from Gradio galleries
+    def extract_pil(img_entry):
+        if isinstance(img_entry, tuple) and isinstance(img_entry[0], Image.Image):
+            return img_entry[0]
+        elif isinstance(img_entry, Image.Image):
+            return img_entry
+        elif isinstance(img_entry, str):
+            return Image.open(img_entry)
+        else:
+            raise gr.Error(f"Unsupported image format: {type(img_entry)}")
+    start_img = extract_pil(input_images[0])
+    end_img   = extract_pil(output_images[0])
+    progress(0.10, desc="Saving temp files...")
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_start, \
          tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_end:
         start_img.save(tmp_start.name)
         end_img.save(tmp_end.name)
+        progress(0.20, desc="Connecting to Wan space...")
+        client = Client("multimodalart/wan-2-2-first-last-frame")
+        progress(0.35, desc="generating video...")
         result = client.predict(
             start_image_pil={"image": handle_file(tmp_start.name)},
             end_image_pil={"image": handle_file(tmp_end.name)},
+            prompt=prompt or "smooth cinematic transition",
+            api_name="/generate_video"
         )
+    progress(0.95, desc="Finalizing...")
+    return result
 SYSTEM_PROMPT = '''
     input_images.change(fn=suggest_next_scene_prompt, inputs=[input_images], outputs=[prompt])
     turn_video_btn.click(
+    fn=lambda: gr.update(visible=True),
+    inputs=None,
+    outputs=[output_video],
+).then(
+    fn=turn_into_video,
     inputs=[input_images, result, prompt],
+    outputs=[output_video],
 )