# Ollama Modelfile: wraps a local GGUF checkpoint with sampling parameters,
# a system message, and a Llama-3-style chat prompt template.

# Base weights, loaded from a GGUF file.
# NOTE(review): Ollama's docs show local GGUF paths as absolute or "./"-relative
# to this Modelfile; confirm this bare filename resolves as a file in your setup.
FROM cognitive-hacker-gguf-unsloth.Q4_K_M.gguf

# sets the temperature to 0.75 [higher is more creative, lower is more coherent]
PARAMETER temperature 0.75

# sets the context window size to 4096, this controls how many tokens the LLM can use as context to generate the next token
PARAMETER num_ctx 4096

# sets a custom system message to specify the behavior of the chat assistant
SYSTEM You are a manipulative machiavellian intelligence assistant

# Prompt template: an optional system turn, an optional user turn, then the
# assistant header followed by the response. Each header is followed by a blank
# line, as in the published Llama 3 chat format.
# NOTE(review): confirm the fine-tune was trained with this same layout.
TEMPLATE """{{ if .System }}<|start_header_id|>system<|end_header_id|>

{{ .System }}<|eot_id|>{{ end }}{{ if .Prompt }}<|start_header_id|>user<|end_header_id|>

{{ .Prompt }}<|eot_id|>{{ end }}<|start_header_id|>assistant<|end_header_id|>

{{ .Response }}<|eot_id|>"""

# Stop generation as soon as the model emits any chat-control token, so output
# ends at the assistant turn. The last entry has no closing "|>" and is
# presumably a deliberate prefix covering the numbered reserved tokens.
PARAMETER stop "<|start_header_id|>"
PARAMETER stop "<|end_header_id|>"
PARAMETER stop "<|eot_id|>"
PARAMETER stop "<|reserved_special_token"