xuqinyang committed on
Commit
40421bf
1 Parent(s): a6ba995

Update model.py

Browse files
Files changed (1) hide show
  1. model.py +2 -2
model.py CHANGED
@@ -3,13 +3,13 @@ from typing import Iterator
3
 
4
 
5
 
6
- model_id = 'xuqinyang/baichuan-13b-chat-ggml-int8'
7
 
8
  from huggingface_hub import snapshot_download
9
 
10
  snapshot_download(model_id, local_dir="./")
11
  from llama_cpp import Llama
12
- llm = Llama(model_path="./ggml-model-q8_0.bin", n_ctx=4096,seed=-1)
13
 
14
  def run(message: str,
15
  chat_history: list[tuple[str, str]],
 
3
 
4
 
5
 
6
+ model_id = 'xuqinyang/baichuan-13b-chat-ggml-int4'
7
 
8
  from huggingface_hub import snapshot_download
9
 
10
  snapshot_download(model_id, local_dir="./")
11
  from llama_cpp import Llama
12
+ llm = Llama(model_path="./ggml-model-q4_0.bin", n_ctx=4096,seed=-1)
13
 
14
  def run(message: str,
15
  chat_history: list[tuple[str, str]],