# Ollama Modelfile: serves a local GGUF export behind a Llama-3-style chat template.
#
# NOTE(review): the GGUF filename suggests a Mistral 7B Instruct base, but the
# template below uses Llama 3 header tokens (<|start_header_id|>, <|eot_id|>).
# That is only correct if the model was fine-tuned with this chat format --
# confirm against the training setup before changing either side.
FROM ./mistral_7b_instruct_v2_quant_v2-unsloth.Q4_K_M.gguf

# Sampling temperature, set to 1 (higher is more creative, lower is more coherent).
PARAMETER temperature 1

# Context window size: how many tokens the model can use as context when
# generating the next token.
PARAMETER num_ctx 4096

# Chat prompt layout. Everything between the triple quotes is sent to the model
# verbatim, so whitespace matters: each role header is followed by exactly one
# blank line before the message content. The system and user sections are only
# rendered when the corresponding value is present.
TEMPLATE """{{ if .System }}<|start_header_id|>system<|end_header_id|>

{{ .System }}<|eot_id|>{{ end }}{{ if .Prompt }}<|start_header_id|>user<|end_header_id|>

{{ .Prompt }}<|eot_id|>{{ end }}<|start_header_id|>assistant<|end_header_id|>

{{ .Response }}<|eot_id|>"""

# Stop sequences: end generation as soon as the model emits any of the template's
# control tokens, so it cannot run on into a new turn. The last entry is a
# prefix, so it matches every token that starts with "<|reserved_special_token".
PARAMETER stop "<|start_header_id|>"
PARAMETER stop "<|end_header_id|>"
PARAMETER stop "<|eot_id|>"
PARAMETER stop "<|reserved_special_token"