nacujapj7 committed on
Commit
ff2dfa9
1 Parent(s): db92ed0

fix(Llama): increase context window to 1024

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -9,7 +9,7 @@ from llama_cpp import Llama
9
  from huggingface_hub import hf_hub_download
10
 
11
  hf_hub_download(repo_id="TheBloke/dolphin-2_6-phi-2-GGUF", filename="dolphin-2_6-phi-2.Q5_K_S.gguf", local_dir=".")
12
- llm = Llama(model_path="./dolphin-2_6-phi-2.Q5_K_S.gguf", n_ctx=512, last_n_tokens_size=256, n_threads=4, n_gpu_layers=0)
13
 
14
  ins = '''<|im_start|>user
15
  {question}<|im_end|>
 
9
  from huggingface_hub import hf_hub_download
10
 
11
  hf_hub_download(repo_id="TheBloke/dolphin-2_6-phi-2-GGUF", filename="dolphin-2_6-phi-2.Q5_K_S.gguf", local_dir=".")
12
+ llm = Llama(model_path="./dolphin-2_6-phi-2.Q5_K_S.gguf", n_ctx=1024)
13
 
14
  ins = '''<|im_start|>user
15
  {question}<|im_end|>