Kai Jennissen
commited on
updated tools description
Browse files
agent.py
CHANGED
|
@@ -161,6 +161,7 @@ def get_agent():
|
|
| 161 |
model_id="Qwen/Qwen2.5-VL-32B-Instruct", # provider="together"
|
| 162 |
),
|
| 163 |
max_steps=3,
|
|
|
|
| 164 |
name="Multimedia_Agent",
|
| 165 |
description="An agent that can process and analyze images, audio, video, and other files. It needs to be provided with a valid URL to fetch the file.",
|
| 166 |
verbosity_level=1,
|
|
@@ -192,7 +193,7 @@ def get_agent():
|
|
| 192 |
model=OpenAIServerModel(model_id="gpt-4.1", temperature=0.1),
|
| 193 |
max_steps=5,
|
| 194 |
planning_interval=10,
|
| 195 |
-
additional_authorized_imports=["pandas", "numpy"],
|
| 196 |
verbosity_level=2,
|
| 197 |
)
|
| 198 |
|
|
|
|
| 161 |
model_id="Qwen/Qwen2.5-VL-32B-Instruct", # provider="together"
|
| 162 |
),
|
| 163 |
max_steps=3,
|
| 164 |
+
additional_authorized_imports=["pandas", "numpy", "openpyxl"],
|
| 165 |
name="Multimedia_Agent",
|
| 166 |
description="An agent that can process and analyze images, audio, video, and other files. It needs to be provided with a valid URL to fetch the file.",
|
| 167 |
verbosity_level=1,
|
|
|
|
| 193 |
model=OpenAIServerModel(model_id="gpt-4.1", temperature=0.1),
|
| 194 |
max_steps=5,
|
| 195 |
planning_interval=10,
|
| 196 |
+
additional_authorized_imports=["pandas", "numpy", "openpyxl"],
|
| 197 |
verbosity_level=2,
|
| 198 |
)
|
| 199 |
|
app.py
CHANGED
|
@@ -109,7 +109,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
|
|
| 109 |
results_log = []
|
| 110 |
answers_payload = []
|
| 111 |
print(f"Running agent on {len(questions_data)} questions...")
|
| 112 |
-
for item in questions_data
|
| 113 |
task_id = item.get("task_id")
|
| 114 |
question_text = item.get("question")
|
| 115 |
if not task_id or question_text is None:
|
|
|
|
| 109 |
results_log = []
|
| 110 |
answers_payload = []
|
| 111 |
print(f"Running agent on {len(questions_data)} questions...")
|
| 112 |
+
for item in questions_data:
|
| 113 |
task_id = item.get("task_id")
|
| 114 |
question_text = item.get("question")
|
| 115 |
if not task_id or question_text is None:
|
tools.py
CHANGED
|
@@ -551,13 +551,35 @@ def process_binary(response, filename, content_type):
|
|
| 551 |
@tool
|
| 552 |
def fetch_task_files(url: str) -> Dict[str, Any]:
|
| 553 |
"""
|
| 554 |
-
Download files from a given URL.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 555 |
|
| 556 |
Args:
|
| 557 |
-
url (str): Direct URL to the file to download.
|
|
|
|
| 558 |
|
| 559 |
Returns:
|
| 560 |
-
dict: A dictionary
|
| 561 |
"""
|
| 562 |
files_url = url
|
| 563 |
print(f"Fetching file from: {files_url}")
|
|
|
|
| 551 |
@tool
|
| 552 |
def fetch_task_files(url: str) -> Dict[str, Any]:
|
| 553 |
"""
|
| 554 |
+
Download and process files from a given URL. This tool detects the file type and returns the data in a suitable format for further processing.
|
| 555 |
+
|
| 556 |
+
For different file types, this tool returns:
|
| 557 |
+
|
| 558 |
+
- Images: Returns a data_url that can be directly used with the read_image tool
|
| 559 |
+
Example: result = fetch_task_files(url); then use read_image(question, result["data_url"])
|
| 560 |
+
|
| 561 |
+
- Audio: Returns audio data that can be used with the transcribe_audio tool
|
| 562 |
+
Example: result = fetch_task_files(url); then use transcribe_audio(result["data_url"], result["filename"])
|
| 563 |
+
|
| 564 |
+
- Video: Returns frame extractions and a video buffer for processing with run_video
|
| 565 |
+
Example: result = fetch_task_files(url); you can access frames via result["frame_urls"]
|
| 566 |
+
|
| 567 |
+
- Tabular data (Excel/CSV): Returns parsed data as records, column names, and dimensions
|
| 568 |
+
Example: result = fetch_task_files(url); then analyze data with result["data"] and result["columns"]
|
| 569 |
+
|
| 570 |
+
- Text/Code: Returns the content as text for analysis
|
| 571 |
+
Example: result = fetch_task_files(url); then access text via result["content"]
|
| 572 |
+
|
| 573 |
+
- PDFs & other files: Returns encoded file data for processing
|
| 574 |
+
|
| 575 |
+
All responses include metadata like file_type, filename, and content_type to help determine how to handle the file.
|
| 576 |
|
| 577 |
Args:
|
| 578 |
+
url (str): Direct URL to the file to download. For task files, construct using the API base URL
|
| 579 |
+
and the task ID (e.g., "https://agents-course-unit4-scoring.hf.space/files/{task_id}")
|
| 580 |
|
| 581 |
Returns:
|
| 582 |
+
dict: A dictionary with file data and metadata structured for the specific file type
|
| 583 |
"""
|
| 584 |
files_url = url
|
| 585 |
print(f"Fetching file from: {files_url}")
|