unsubscribe committed on
Commit
3ee9c74
1 Parent(s): ec64302

change model_repo_id

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -5,7 +5,7 @@ from lmdeploy.serve.gradio.turbomind_coupled import *
5
  from lmdeploy.messages import TurbomindEngineConfig
6
 
7
  backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05, model_format='awq')
8
- model_path = 'internlm/internlm2_5-7b-chat-awq'
9
 
10
  InterFace.async_engine = AsyncEngine(
11
  model_path=model_path,
 
5
  from lmdeploy.messages import TurbomindEngineConfig
6
 
7
  backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05, model_format='awq')
8
+ model_path = 'internlm/internlm2_5-7b-chat-4bit'
9
 
10
  InterFace.async_engine = AsyncEngine(
11
  model_path=model_path,