BoyuNLP committed on
Commit
125a54b
•
1 Parent(s): ead51e3
llava/conversation.py CHANGED
@@ -196,7 +196,8 @@ class Conversation:
196
  img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
197
  msg=img_str
198
  if extra_coordinates:
199
- ret.append(["The element is at {extra_coordinates} on the screen:",None])
 
200
  ret.append([msg, None])
201
  break
202
  return ret
 
196
  img_str = f'<img src="data:image/jpeg;base64,{img_b64_str}" alt="user upload image" />'
197
  msg=img_str
198
  if extra_coordinates:
199
+ # msg=ret.append(["The element is at {extra_coordinates} on the screen:",None])+msg
200
+ msg = f"The element is at {extra_coordinates} on the screen:"+ msg
201
  ret.append([msg, None])
202
  break
203
  return ret
llava/serve/gradio_web_server.py CHANGED
@@ -397,7 +397,7 @@ def http_bot(state, model_selector, temperature, top_p, max_new_tokens, request:
397
 
398
  title_markdown = ("""
399
  # UGround: Universal Visual Grounding for GUI Agents
400
- [[Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[Model](https://huggingface.co/osunlp/UGround)] | 📚 [[Paper](https://arxiv.org/abs/2410.05243)]]
401
  """)
402
 
403
  tos_markdown = ("""
@@ -466,7 +466,7 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
466
  # max_output_tokens=16384
467
  #
468
  with gr.Accordion("Parameters", open=False) as parameter_row:
469
- temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0.1, step=0.1, interactive=True, label="Temperature",)
470
  top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
471
  max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
472
 
 
397
 
398
  title_markdown = ("""
399
  # UGround: Universal Visual Grounding for GUI Agents
400
+ [[🏠Project Homepage](https://osu-nlp-group.github.io/UGround/)] [[Code](https://github.com/OSU-NLP-Group/UGround)] [[😊Model](https://huggingface.co/osunlp/UGround)][[📚Paper](https://arxiv.org/abs/2410.05243)]
401
  """)
402
 
403
  tos_markdown = ("""
 
466
  # max_output_tokens=16384
467
  #
468
  with gr.Accordion("Parameters", open=False) as parameter_row:
469
+ temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Temperature",)
470
  top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0, step=0.1, interactive=True, label="Top P",)
471
  max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
472
 
pyproject.toml CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
 
5
  [project]
6
  name = "uground_demo_test"
7
- version = "4.1"
8
  description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
9
  readme = "README.md"
10
  requires-python = ">=3.8"
 
4
 
5
  [project]
6
  name = "uground_demo_test"
7
+ version = "4.2"
8
  description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
9
  readme = "README.md"
10
  requires-python = ">=3.8"