llava-llama-3-8b-v1_1-gguf / OLLAMA_MODELFILE_INT4
pppppM's picture
Create OLLAMA_MODELFILE_INT4
13eff81 verified
raw
history blame
470 Bytes
# Model weights, given as paths relative to this Modelfile.
# The first file is the language model; per its filename it is the int4-quantized GGUF.
FROM ./ggml-model-int4.gguf
# NOTE(review): presumably the f16 multimodal (vision) projector that pairs with the
# language model above for image input — confirm against the model card.
FROM ./mmproj-model-f16.gguf
# Llama 3 instruct chat template.
# Each turn is rendered as:
#   <|start_header_id|>ROLE<|end_header_id|>\n\nMESSAGE<|eot_id|>
# The blank line after every <|end_header_id|> is significant: the Llama 3 prompt
# format separates the role header from the message body with two newlines, and
# using only one yields a prompt that differs from what the model was trained on.
# The system and user turns are emitted only when .System / .Prompt are non-empty;
# the assistant header is always emitted so generation continues from it.
TEMPLATE """{{ if .System }}<|start_header_id|>system<|end_header_id|>

{{ .System }}<|eot_id|>{{ end }}{{ if .Prompt }}<|start_header_id|>user<|end_header_id|>

{{ .Prompt }}<|eot_id|>{{ end }}<|start_header_id|>assistant<|end_header_id|>

{{ .Response }}<|eot_id|>"""
# Stop sequences: the same special markers the TEMPLATE uses to delimit turns.
# Generation halts when any of them is produced, so the model does not run on
# into a new header or a fabricated next turn.
PARAMETER stop "<|start_header_id|>"
PARAMETER stop "<|end_header_id|>"
PARAMETER stop "<|eot_id|>"
# NOTE(review): num_keep is presumably the number of leading prompt tokens retained
# when the context overflows and is truncated — confirm against Ollama's runtime options.
PARAMETER num_keep 4
# Context window size, in tokens.
PARAMETER num_ctx 4096