Spaces:
Runtime error
Runtime error
init
Browse files
- app.py +1 -1
- llava/conversation.py +1 -1
- llava/serve/gradio_web_server.py +1 -1
- pyproject.toml +1 -1
app.py
CHANGED
@@ -47,7 +47,7 @@ def start_worker(model_path: str, bits=4):
|
|
47 |
"--model-path",
|
48 |
model_path,
|
49 |
"--model-name",
|
50 |
-
'llava-v1
|
51 |
"--use-flash-attn",
|
52 |
]
|
53 |
if bits != 16:
|
|
|
47 |
"--model-path",
|
48 |
model_path,
|
49 |
"--model-name",
|
50 |
+
'llava-UGround-v1-4bit',
|
51 |
"--use-flash-attn",
|
52 |
]
|
53 |
if bits != 16:
|
llava/conversation.py
CHANGED
@@ -196,7 +196,7 @@ class Conversation:
|
|
196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
197 |
msg=img_str
|
198 |
if not extra_coordinates:
|
199 |
-
|
200 |
ret.append([msg, None])
|
201 |
break
|
202 |
return ret
|
|
|
196 |
img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
|
197 |
msg=img_str
|
198 |
if not extra_coordinates:
|
199 |
+
ret.append(["The element is at {extra_coordinates} on the screen:",None])
|
200 |
ret.append([msg, None])
|
201 |
break
|
202 |
return ret
|
llava/serve/gradio_web_server.py
CHANGED
@@ -447,7 +447,7 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
|
|
447 |
interactive=True,
|
448 |
show_label=False,
|
449 |
container=False)
|
450 |
-
# model_selector="llava-v1
|
451 |
|
452 |
imagebox = gr.Image(type="pil")
|
453 |
image_process_mode = gr.Radio(
|
|
|
447 |
interactive=True,
|
448 |
show_label=False,
|
449 |
container=False)
|
450 |
+
# model_selector="llava-UGround-v1-4bit"
|
451 |
|
452 |
imagebox = gr.Image(type="pil")
|
453 |
image_process_mode = gr.Radio(
|
pyproject.toml
CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4 |
|
5 |
[project]
|
6 |
name = "uground_demo_test"
|
7 |
-
version = "
|
8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
9 |
readme = "README.md"
|
10 |
requires-python = ">=3.8"
|
|
|
4 |
|
5 |
[project]
|
6 |
name = "uground_demo_test"
|
7 |
+
version = "4.0"
|
8 |
description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
|
9 |
readme = "README.md"
|
10 |
requires-python = ">=3.8"
|