Spaces:
Running
on
A10G
Running
on
A10G
init
Browse files
- llava/conversation.py +2 -1
- llava/serve/gradio_web_server.py +2 -2
- pyproject.toml +1 -1
llava/conversation.py
CHANGED
@@ -196,7 +196,8 @@ class Conversation:
|
|
196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
197 |
msg=img_str
|
198 |
if extra_coordinates:
|
199 |
-
ret.append(["The element is at {extra_coordinates} on the screen:",None])
|
|
|
200 |
ret.append([msg, None])
|
201 |
break
|
202 |
return ret
|
|
|
196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
197 |
msg=img_str
|
198 |
if extra_coordinates:
|
199 |
+
# msg=ret.append(["The element is at {extra_coordinates} on the screen:",None])+msg
|
200 |
+
msg = f"The element is at {extra_coordinates} on the screen:"+ msg
|
201 |
ret.append([msg, None])
|
202 |
break
|
203 |
return ret
|
llava/serve/gradio_web_server.py
CHANGED
@@ -397,7 +397,7 @@ def http_bot(state, model_selector, temperature, top_p, max_new_tokens, request:
|
|
397 |
|
398 |
title_markdown = ("""
|
399 |
# UGround: Universal Visual Grounding for GUI Agents
|
400 |
-
[[Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[Model](https://huggingface.co/osunlp/UGround)]
|
401 |
""")
|
402 |
|
403 |
tos_markdown = ("""
|
@@ -466,7 +466,7 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
|
|
466 |
# max_output_tokens=16384
|
467 |
#
|
468 |
with gr.Accordion("Parameters", open=False) as parameter_row:
|
469 |
-
temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0
|
470 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
|
471 |
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
|
472 |
|
|
|
397 |
|
398 |
title_markdown = ("""
|
399 |
# UGround: Universal Visual Grounding for GUI Agents
|
400 |
+
[[🏠 Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[Model](https://huggingface.co/osunlp/UGround)][[Paper](https://arxiv.org/abs/2410.05243)]
|
401 |
""")
|
402 |
|
403 |
tos_markdown = ("""
|
|
|
466 |
# max_output_tokens=16384
|
467 |
#
|
468 |
with gr.Accordion("Parameters", open=False) as parameter_row:
|
469 |
+
temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Temperature",)
|
470 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
|
471 |
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
|
472 |
|
pyproject.toml
CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4 |
|
5 |
[project]
|
6 |
name = "uground_demo_test"
|
7 |
-
version = "4.
|
8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
9 |
readme = "README.md"
|
10 |
requires-python = ">=3.8"
|
|
|
4 |
|
5 |
[project]
|
6 |
name = "uground_demo_test"
|
7 |
+
version = "4.2"
|
8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
9 |
readme = "README.md"
|
10 |
requires-python = ">=3.8"
|