Spaces:
Runtime error
Runtime error
pseudotensor
committed on
Commit
•
d5357c2
1
Parent(s):
31cc3ef
Update with h2oGPT hash c8a6d015ef453351b3c2dff18a23370f380278aa
Browse files- gradio_runner.py +2 -2
- prompter.py +2 -1
gradio_runner.py
CHANGED
@@ -246,7 +246,7 @@ def go_gradio(**kwargs):
|
|
246 |
value=kwargs['top_k'], label="Top k",
|
247 |
info='Num. tokens to sample from'
|
248 |
)
|
249 |
-
max_beams = 8 if not is_low_mem else
|
250 |
num_beams = gr.Slider(minimum=1, maximum=max_beams, step=1,
|
251 |
value=min(max_beams, kwargs['num_beams']), label="Beams",
|
252 |
info="Number of searches for optimal overall probability. "
|
@@ -865,7 +865,7 @@ def go_gradio(**kwargs):
|
|
865 |
# FIXME: have to click once to stop output and second time to stop GPUs going
|
866 |
stop_btn.click(lambda: None, None, None,
|
867 |
cancels=[submit_event_nochat, submit_event, submit_event2, submit_event3],
|
868 |
-
queue=False, api_name='stop' if allow_api else None).then(clear_torch_cache)
|
869 |
demo.load(None, None, None, _js=get_dark_js() if kwargs['h2ocolors'] else None)
|
870 |
|
871 |
demo.queue(concurrency_count=kwargs['concurrency_count'], api_open=kwargs['api_open'])
|
|
|
246 |
value=kwargs['top_k'], label="Top k",
|
247 |
info='Num. tokens to sample from'
|
248 |
)
|
249 |
+
max_beams = 8 if not is_low_mem else 1
|
250 |
num_beams = gr.Slider(minimum=1, maximum=max_beams, step=1,
|
251 |
value=min(max_beams, kwargs['num_beams']), label="Beams",
|
252 |
info="Number of searches for optimal overall probability. "
|
|
|
865 |
# FIXME: have to click once to stop output and second time to stop GPUs going
|
866 |
stop_btn.click(lambda: None, None, None,
|
867 |
cancels=[submit_event_nochat, submit_event, submit_event2, submit_event3],
|
868 |
+
queue=False, api_name='stop' if allow_api else None).then(clear_torch_cache, queue=False)
|
869 |
demo.load(None, None, None, _js=get_dark_js() if kwargs['h2ocolors'] else None)
|
870 |
|
871 |
demo.queue(concurrency_count=kwargs['concurrency_count'], api_open=kwargs['api_open'])
|
prompter.py
CHANGED
@@ -71,7 +71,8 @@ class Prompter(object):
|
|
71 |
output = output.split(self.pre_response)[1]
|
72 |
allow_terminate = True
|
73 |
else:
|
74 |
-
|
|
|
75 |
allow_terminate = False
|
76 |
else:
|
77 |
allow_terminate = True
|
|
|
71 |
output = output.split(self.pre_response)[1]
|
72 |
allow_terminate = True
|
73 |
else:
|
74 |
+
if output:
|
75 |
+
print("Failure of parsing or not enough output yet: %s" % output, flush=True)
|
76 |
allow_terminate = False
|
77 |
else:
|
78 |
allow_terminate = True
|