Spaces: Running on Zero
Joseph Pollack
committed on
adds model loading and removes deprecated messages format
app.py CHANGED
@@ -126,13 +126,13 @@ class LOperatorDemo:
             return f"β Error generating action: {str(e)}"
 
     @spaces.GPU(duration=90)  # 1.5 minutes for chat responses
-    def chat_with_model(self, message: str, history: List[
+    def chat_with_model(self, message: str, history: List[Dict[str, str]], image: Image.Image = None) -> List[Dict[str, str]]:
         """Chat interface function for Gradio"""
         if not self.is_loaded:
-            return history + [
+            return history + [{"role": "user", "content": message}, {"role": "assistant", "content": "β Model not loaded. Please load the model first."}]
 
         if image is None:
-            return history + [
+            return history + [{"role": "user", "content": message}, {"role": "assistant", "content": "β Please upload an Android screenshot image."}]
 
         try:
             # Extract goal and instruction from message
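The rewritten signature returns history in Gradio's "messages" format, a list of {"role", "content"} dicts rather than the older tuple pairs this commit retires, while @spaces.GPU(duration=90) is the ZeroGPU hook that attaches a GPU for up to 90 seconds per call. The snippet below is a minimal standalone sketch of that history format with an illustrative helper name; it is not code from app.py.

# Sketch only: messages-format chat history as returned by chat_with_model above.
from typing import Dict, List

def append_turn(history: List[Dict[str, str]], user_msg: str, assistant_msg: str) -> List[Dict[str, str]]:
    """Return a new messages-format history with one user/assistant exchange appended."""
    return history + [
        {"role": "user", "content": user_msg},
        {"role": "assistant", "content": assistant_msg},
    ]

history: List[Dict[str, str]] = []
history = append_turn(history, "Goal: open settings\nStep: tap the gear icon", '{"action_type": "click"}')
print(history)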
@@ -149,7 +149,7 @@ class LOperatorDemo:
                     instruction = line.replace("Step:", "").strip()
 
             if not goal or not instruction:
-                return history + [
+                return history + [{"role": "user", "content": message}, {"role": "assistant", "content": "β Please provide both Goal and Step in your message."}]
         else:
             # Treat as general instruction
             goal = "Complete the requested action"
@@ -157,15 +157,32 @@ class LOperatorDemo:
 
             # Generate action
             response = self.generate_action(image, goal, instruction)
-            return history + [
+            return history + [{"role": "user", "content": message}, {"role": "assistant", "content": response}]
 
         except Exception as e:
             logger.error(f"Error in chat: {str(e)}")
-            return history + [
+            return history + [{"role": "user", "content": message}, {"role": "assistant", "content": f"β Error: {str(e)}"}]
 
 # Initialize demo
 demo_instance = LOperatorDemo()
 
+# Auto-load the model on startup
+def auto_load_model():
+    """Auto-load the model when the application starts"""
+    try:
+        logger.info("Auto-loading L-Operator model on startup...")
+        result = demo_instance.load_model()
+        logger.info(f"Auto-load result: {result}")
+        return result
+    except Exception as e:
+        logger.error(f"Error auto-loading model: {str(e)}")
+        return f"β Error auto-loading model: {str(e)}"
+
+# Load model automatically (this happens during import)
+print("π Auto-loading L-Operator model on startup...")
+auto_load_model()
+print("β Model loading completed!")
+
 # Load example episodes
 def load_example_episodes():
     """Load example episodes from the extracted data"""
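Calling auto_load_model() at module level means the weights are fetched once when the Space process boots rather than on the first chat request; on ZeroGPU this import-time work runs on CPU, with a GPU attached only inside the @spaces.GPU-decorated calls. Below is a stripped-down sketch of the pattern, with a placeholder loader class standing in for LOperatorDemo; it is illustrative, not the repository's implementation.

# Sketch only: load-at-import startup pattern (PlaceholderDemo stands in for LOperatorDemo).
import logging

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

class PlaceholderDemo:
    def __init__(self) -> None:
        self.is_loaded = False

    def load_model(self) -> str:
        self.is_loaded = True  # real code would download and load model weights here
        return "Model loaded"

demo_instance = PlaceholderDemo()

def auto_load_model() -> str:
    """Load the model once at startup; log and report errors instead of raising."""
    try:
        logger.info("Auto-loading model on startup...")
        return demo_instance.load_model()
    except Exception as exc:
        logger.error("Error auto-loading model: %s", exc)
        return f"Error auto-loading model: {exc}"

auto_load_model()  # executes during import, i.e. when the Space boots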
@@ -233,7 +250,7 @@ def create_demo():
 
     ## π How to Use
 
-    1. **
+    1. **Model Loading**: The L-Operator model loads automatically on startup
     2. **Upload Screenshot**: Upload an Android device screenshot
     3. **Provide Instructions**: Enter your goal and step instructions
     4. **Get Actions**: The model will generate JSON actions for Android device control
@@ -257,6 +274,13 @@ def create_demo():
 
         with gr.Row():
             with gr.Column(scale=1):
+                gr.Markdown("### π€ Model Status")
+                model_status = gr.Textbox(
+                    label="L-Operator Model",
+                    value="π Loading model on startup...",
+                    interactive=False
+                )
+
                 gr.Markdown("### π± Input")
                 image_input = gr.Image(
                     label="Android Screenshot",
@@ -288,6 +312,7 @@ def create_demo():
                     title="L-Operator Chat",
                     description="Chat with L-Operator using screenshots and text instructions",
                     examples=load_example_episodes(),
+                    type="messages"
                 )
 
                 gr.Markdown("### π― Action Output")
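Passing type="messages" tells gr.ChatInterface to store and pass history as role/content dicts, matching the new chat_with_model return value and avoiding the deprecation warning that recent Gradio releases emit for the old tuple format. A self-contained sketch, with a trivial echo function standing in for the model-backed chat handler:

# Sketch only: a ChatInterface configured for messages-format history.
import gradio as gr

def echo(message, history):
    # In "messages" mode, history arrives as a list of {"role", "content"} dicts.
    return f"You said: {message}"

chat = gr.ChatInterface(fn=echo, type="messages", title="Messages-format chat")

if __name__ == "__main__":
    chat.launch()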
@@ -298,9 +323,6 @@ def create_demo():
                 )
 
         # Event handlers
-        def on_load_model():
-            return demo_instance.load_model()
-
         def on_generate_action(image, goal, step):
             if not image:
                 return {"error": "Please upload an image"}
@@ -317,10 +339,12 @@ def create_demo():
             except:
                 return {"raw_response": response}
 
-
-
-
-
+        # Update model status on page load
+        def update_model_status():
+            if demo_instance.is_loaded:
+                return "β L-Operator model loaded and ready!"
+            else:
+                return "β Model failed to load. Please check logs."
 
         generate_btn.click(
             fn=on_generate_action,
@@ -328,6 +352,12 @@ def create_demo():
             outputs=action_output
         )
 
+        # Update model status on page load
+        demo.load(
+            fn=update_model_status,
+            outputs=model_status
+        )
+
         # Update chat interface when image changes
         def update_chat_image(image):
             return image
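demo.load attaches update_model_status to the page-load event of the Blocks app, so the status textbox reflects whether the startup load succeeded each time a visitor opens the page. A minimal standalone sketch of that wiring (component names illustrative, assuming Gradio 4.x or later):

# Sketch only: refreshing a status textbox on page load via Blocks.load.
import gradio as gr

MODEL_READY = True  # stand-in for demo_instance.is_loaded

def update_model_status() -> str:
    return "Model loaded and ready!" if MODEL_READY else "Model failed to load. Please check logs."

with gr.Blocks() as demo:
    model_status = gr.Textbox(label="L-Operator Model", value="Loading model on startup...", interactive=False)
    demo.load(fn=update_model_status, outputs=model_status)  # runs whenever the page is opened

if __name__ == "__main__":
    demo.launch()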