File size: 266 Bytes
64777a0
 
 
 
 
1
2
3
4
5
# Ollama Modelfile: builds a model from a local GGUF weights file with
# conservative sampling and a small context window.

# Base model weights, read from the GGUF file `llama.gguf`
# (NOTE(review): path is presumably resolved relative to this Modelfile — confirm).
FROM llama.gguf
# Sets the sampling temperature to 0.1 [higher is more creative, lower is more coherent].
PARAMETER temperature 0.1
# Sets the context window size to 1024 tokens; this controls how many tokens
# the LLM can use as context to generate the next token.
PARAMETER num_ctx 1024