```
FROM llama.gguf
# sets the temperature to 0.1 [higher is more creative, lower is more coherent]
PARAMETER temperature 0.1
# sets the context window size to 1024; this controls how many tokens the LLM can use as context to generate the next token
PARAMETER num_ctx 1024
```
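Assuming the Modelfile above is saved as `Modelfile` next to `llama.gguf`, it can be built and run with the Ollama CLI roughly as sketched below (the model name `llama-custom` is just an illustrative placeholder):

```
# build a local model from the Modelfile (the name is a placeholder)
ollama create llama-custom -f Modelfile

# start an interactive session with the newly created model
ollama run llama-custom
```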