Spaces:
Running
on
A10G
Running
on
A10G
Shanshan Wang
committed on
Commit
•
d6bfd67
1
Parent(s):
2d6f1c5
use model.ocr for 0.8b model
Browse files
app.py
CHANGED
@@ -125,15 +125,28 @@ def inference(image_input,
|
|
125 |
)
|
126 |
|
127 |
# Call model.chat with history
|
128 |
-
|
129 |
-
|
130 |
-
|
131 |
-
|
132 |
-
|
133 |
-
|
134 |
-
|
135 |
-
|
136 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
137 |
|
138 |
# update the state with new_state
|
139 |
state = new_state
|
@@ -197,17 +210,28 @@ def regenerate_response(chatbot,
|
|
197 |
top_p= float(top_p),
|
198 |
)
|
199 |
|
200 |
-
|
201 |
# Regenerate the response
|
202 |
-
|
203 |
-
|
204 |
-
|
205 |
-
|
206 |
-
|
207 |
-
|
208 |
-
|
209 |
-
|
210 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
211 |
|
212 |
# Update the state with new_state
|
213 |
state = new_state
|
@@ -304,7 +328,7 @@ with gr.Blocks() as demo:
|
|
304 |
interactive=True,
|
305 |
label="Top P")
|
306 |
max_new_tokens_input = gr.Slider(
|
307 |
-
minimum=
|
308 |
maximum=4096,
|
309 |
step=64,
|
310 |
value=1024,
|
|
|
125 |
)
|
126 |
|
127 |
# Call model.chat with history
|
128 |
+
if '2b' in model_name.lower():
|
129 |
+
response_text, new_state = model.chat(
|
130 |
+
tokenizer,
|
131 |
+
image_input,
|
132 |
+
user_message,
|
133 |
+
max_tiles = int(tile_num),
|
134 |
+
generation_config=generation_config,
|
135 |
+
history=state,
|
136 |
+
return_history=True
|
137 |
+
)
|
138 |
+
|
139 |
+
|
140 |
+
if '0.8b' in model_name.lower():
|
141 |
+
response_text, new_state = model.ocr(
|
142 |
+
tokenizer,
|
143 |
+
image_input,
|
144 |
+
user_message,
|
145 |
+
max_tiles = int(tile_num),
|
146 |
+
generation_config=generation_config,
|
147 |
+
history=state,
|
148 |
+
return_history=True
|
149 |
+
)
|
150 |
|
151 |
# update the state with new_state
|
152 |
state = new_state
|
|
|
210 |
top_p= float(top_p),
|
211 |
)
|
212 |
|
213 |
+
|
214 |
# Regenerate the response
|
215 |
+
if '2b' in model_name.lower():
|
216 |
+
response_text, new_state = model.chat(
|
217 |
+
tokenizer,
|
218 |
+
image_input,
|
219 |
+
last_user_message,
|
220 |
+
max_tiles = int(tile_num),
|
221 |
+
generation_config=generation_config,
|
222 |
+
history=state, # Exclude last assistant's response
|
223 |
+
return_history=True
|
224 |
+
)
|
225 |
+
if '0.8b' in model_name.lower():
|
226 |
+
response_text, new_state = model.ocr(
|
227 |
+
tokenizer,
|
228 |
+
image_input,
|
229 |
+
last_user_message,
|
230 |
+
max_tiles = int(tile_num),
|
231 |
+
generation_config=generation_config,
|
232 |
+
history=state, # Exclude last assistant's response
|
233 |
+
return_history=True
|
234 |
+
)
|
235 |
|
236 |
# Update the state with new_state
|
237 |
state = new_state
|
|
|
328 |
interactive=True,
|
329 |
label="Top P")
|
330 |
max_new_tokens_input = gr.Slider(
|
331 |
+
minimum=64,
|
332 |
maximum=4096,
|
333 |
step=64,
|
334 |
value=1024,
|