BoyuNLP committed on
Commit
1aaea48
1 Parent(s): cf4e43c
Files changed (2) hide show
  1. llava/serve/gradio_web_server.py +10 -2
  2. pyproject.toml +1 -1
llava/serve/gradio_web_server.py CHANGED
@@ -31,6 +31,7 @@ from PIL import Image
31
  import io
32
  import base64
33
 
 
34
  def resize_image(image, default_width=(1344, 896), request_width=None):
35
  # 如果 request 中指定了 width,则使用传入的值
36
  if request_width:
@@ -38,7 +39,7 @@ def resize_image(image, default_width=(1344, 896), request_width=None):
38
 
39
  original_width, original_height = image.size
40
 
41
- print(original_width,original_height)
42
 
43
  # 根据宽高比决定 resize 逻辑
44
  if original_width >= original_height:
@@ -54,7 +55,14 @@ def resize_image(image, default_width=(1344, 896), request_width=None):
54
 
55
  # 调整图像大小
56
  resized_image = image.resize((new_width, new_height))
57
- print(new_width,new_height)
 
 
 
 
 
 
 
58
  return resized_image
59
 
60
 
 
31
  import io
32
  import base64
33
 
34
+
35
  def resize_image(image, default_width=(1344, 896), request_width=None):
36
  # 如果 request 中指定了 width,则使用传入的值
37
  if request_width:
 
39
 
40
  original_width, original_height = image.size
41
 
42
+ print("Original size:", original_width, original_height)
43
 
44
  # 根据宽高比决定 resize 逻辑
45
  if original_width >= original_height:
 
55
 
56
  # 调整图像大小
57
  resized_image = image.resize((new_width, new_height))
58
+ print("After initial resize:", new_width, new_height)
59
+
60
+ # 如果高度仍然超过 2016,则将图片固定调整为 672x2016
61
+ if new_height > 2016:
62
+ new_width, new_height = 672, 2016
63
+ resized_image = resized_image.resize((new_width, new_height))
64
+ print("Adjusted to fixed size:", new_width, new_height)
65
+
66
  return resized_image
67
 
68
 
pyproject.toml CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
 
5
  [project]
6
  name = "uground_demo_test"
7
- version = "3.5"
8
  description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
9
  readme = "README.md"
10
  requires-python = ">=3.8"
 
4
 
5
  [project]
6
  name = "uground_demo_test"
7
+ version = "3.6"
8
  description = "Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents"
9
  readme = "README.md"
10
  requires-python = ">=3.8"