# Ollama Modelfile: builds a model from the local GGUF weights file below.
FROM ./llama-3-1b-medical-chatbot.gguf

# Sampling temperature: set low (0.2) for more coherent, less creative output
# [higher is more creative, lower is more coherent].
PARAMETER temperature 0.2

# Nucleus sampling cutoff.
PARAMETER top_p 0.9

# Upper bound on the number of tokens generated per response.
PARAMETER num_predict 256

# Stop sequences: generation halts as soon as any of these header/turn
# marker tokens is produced. Each must match the token text exactly, so
# no trailing characters may follow them on the line.
PARAMETER stop <|start_header_id|>
PARAMETER stop <|end_header_id|>
PARAMETER stop <|eot_id|>