Spaces:
Runtime error
Runtime error
init
Browse files
- llava/conversation.py +2 -1
- llava/serve/gradio_web_server.py +2 -2
- pyproject.toml +1 -1
llava/conversation.py
CHANGED
|
@@ -196,7 +196,8 @@ class Conversation:
|
|
| 196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
| 197 |
msg=img_str
|
| 198 |
if extra_coordinates:
|
| 199 |
-
ret.append(["The element is at {extra_coordinates} on the screen:",None])
|
|
|
|
| 200 |
ret.append([msg, None])
|
| 201 |
break
|
| 202 |
return ret
|
|
|
|
| 196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
| 197 |
msg=img_str
|
| 198 |
if extra_coordinates:
|
| 199 |
+
# msg=ret.append(["The element is at {extra_coordinates} on the screen:",None])+msg
|
| 200 |
+
msg = f"The element is at {extra_coordinates} on the screen:"+ msg
|
| 201 |
ret.append([msg, None])
|
| 202 |
break
|
| 203 |
return ret
|
llava/serve/gradio_web_server.py
CHANGED
|
@@ -397,7 +397,7 @@ def http_bot(state, model_selector, temperature, top_p, max_new_tokens, request:
|
|
| 397 |
|
| 398 |
title_markdown = ("""
|
| 399 |
# UGround: Universal Visual Grounding for GUI Agents
|
| 400 |
-
[[Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[Model](https://huggingface.co/osunlp/UGround)]
|
| 401 |
""")
|
| 402 |
|
| 403 |
tos_markdown = ("""
|
|
@@ -466,7 +466,7 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
|
|
| 466 |
# max_output_tokens=16384
|
| 467 |
#
|
| 468 |
with gr.Accordion("Parameters", open=False) as parameter_row:
|
| 469 |
-
temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0
|
| 470 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
|
| 471 |
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
|
| 472 |
|
|
|
|
| 397 |
|
| 398 |
title_markdown = ("""
|
| 399 |
# UGround: Universal Visual Grounding for GUI Agents
|
| 400 |
+
[[🏠 Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[Model](https://huggingface.co/osunlp/UGround)][[Paper](https://arxiv.org/abs/2410.05243)]
|
| 401 |
""")
|
| 402 |
|
| 403 |
tos_markdown = ("""
|
|
|
|
| 466 |
# max_output_tokens=16384
|
| 467 |
#
|
| 468 |
with gr.Accordion("Parameters", open=False) as parameter_row:
|
| 469 |
+
temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Temperature",)
|
| 470 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
|
| 471 |
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
|
| 472 |
|
pyproject.toml
CHANGED
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
| 4 |
|
| 5 |
[project]
|
| 6 |
name = "uground_demo_test"
|
| 7 |
-
version = "4.
|
| 8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
| 9 |
readme = "README.md"
|
| 10 |
requires-python = ">=3.8"
|
|
|
|
| 4 |
|
| 5 |
[project]
|
| 6 |
name = "uground_demo_test"
|
| 7 |
+
version = "4.2"
|
| 8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
| 9 |
readme = "README.md"
|
| 10 |
requires-python = ">=3.8"
|