Baichuan-13B-Chat-Int4-Cpp

Runtime error

xuqinyang committed on Jul 25, 2023

Commit

40421bf

•

1 Parent(s): a6ba995

Update model.py

Files changed (1) hide show

model.py CHANGED Viewed

@@ -3,13 +3,13 @@ from typing import Iterator
-model_id = 'xuqinyang/baichuan-13b-chat-ggml-int8'
 from huggingface_hub import snapshot_download
 snapshot_download(model_id, local_dir="./")
 from llama_cpp import Llama
-llm = Llama(model_path="./ggml-model-q8_0.bin", n_ctx=4096,seed=-1)
 def run(message: str,
         chat_history: list[tuple[str, str]],

+model_id = 'xuqinyang/baichuan-13b-chat-ggml-int4'
 from huggingface_hub import snapshot_download
 snapshot_download(model_id, local_dir="./")
 from llama_cpp import Llama
+llm = Llama(model_path="./ggml-model-q4_0.bin", n_ctx=4096,seed=-1)
 def run(message: str,
         chat_history: list[tuple[str, str]],