Spaces:

amberborici
/

Qwen-Qwen2-VL-7B-Instruct

Running

App Files Files Community

amberborici committed on Aug 8

Commit

f712aee

1 Parent(s): 15d32eb

sddsd

Browse files

Files changed (1) hide show

app.py +15 -28

app.py CHANGED Viewed

@@ -6,6 +6,13 @@ qwen_model = gr.load("models/Qwen/Qwen2-VL-7B-Instruct")
 def process_images(images, prompt):
     """
     Process multiple images with the Qwen2-VL model
     """
     if not images:
         return "Please upload at least one image."
@@ -17,35 +24,15 @@ def process_images(images, prompt):
             continue
         try:
-            # Prepare the message for the model
-            message = [
-                {
-                    "role": "user",
-                    "content": [
-                        {
-                            "type": "text",
-                            "text": prompt
-                        },
-                        {
-                            "type": "image_url",
-                            "image_url": {
-                                "url": image
-                            }
-                        }
-                    ]
-                }
-            ]
-            # Generate response using the loaded model
-            response = qwen_model.chat.completions.create(
-                model="Qwen/Qwen2-VL-7B-Instruct",
-                messages=message,
-                max_tokens=512,
-                temperature=0.7
             )
-            # Extract the response text
-            description = response.choices[0].message.content
             results.append(f"Image {i+1}: {description}")
         except Exception as e:
@@ -154,4 +141,4 @@ with gr.Blocks(
 # Launch the app
 if __name__ == "__main__":
-    demo.launch()

 def process_images(images, prompt):
     """
     Process multiple images with the Qwen2-VL model
+    Args:
+        images: List of uploaded images
+        prompt: User-provided prompt
+    Returns:
+        List of generated descriptions
     """
     if not images:
         return "Please upload at least one image."
             continue
         try:
+            # For vision models, we pass the image and text directly
+            # The model expects the image and prompt as separate arguments
+            response = qwen_model(
+                prompt,  # Text prompt
+                image    # Image file
             )
+            # The response should be the generated text
+            description = response
             results.append(f"Image {i+1}: {description}")
         except Exception as e:
 # Launch the app
 if __name__ == "__main__":
+    demo.launch()