FROM ./mistral_7b_instruct_v2_quant_v2-unsloth.Q4_K_M.gguf
# sets the temperature to 1 [higher is more creative, lower is more coherent]
PARAMETER temperature 1
# sets the context window size to 4096; this controls how many tokens the LLM can use as context to generate the next token
PARAMETER num_ctx 4096
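# TEMPLATE defines the chat prompt in Go template syntax; Ollama fills in .System, .Prompt, and .Response at request time.
# Note: the <|start_header_id|>/<|eot_id|> markers below follow the Llama 3 chat format; if this GGUF was not fine-tuned on that format, Mistral's native [INST] ... [/INST] prompt may work better.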
| TEMPLATE """{{ if .System }}<|start_header_id|>system<|end_header_id|> | |
| {{ .System }}<|eot_id|>{{ end }}{{ if .Prompt }}<|start_header_id|>user<|end_header_id|> | |
| {{ .Prompt }}<|eot_id|>{{ end }}<|start_header_id|>assistant<|end_header_id|> | |
| {{ .Response }}<|eot_id|>""" | |
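# stop sequences: generation halts as soon as the model emits any of these strings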
| PARAMETER stop "<|start_header_id|>" | |
| PARAMETER stop "<|end_header_id|>" | |
| PARAMETER stop "<|eot_id|>" | |
| PARAMETER stop "<|reserved_special_token" |