Files
ollama-utils/modelfile-repo/qwen3-8b-q5_k_m.Modelfile
2026-01-18 22:25:27 +01:00

31 lines
782 B
Plaintext

# ollama-utils-metadata
# hf_upstream: https://huggingface.co/Qwen/Qwen3-8B-GGUF/blob/main/qwen3-8b-q5_k_m.gguf
# capabilities: tools,thinking
FROM ./qwen3-8b-q5_k_m.gguf
# ---- Token budget ----------------------------------------------------------
# Generation is capped at 32768 tokens inside a 40960-token context window,
# so 8192 tokens of the window remain for the prompt side.
PARAMETER num_predict 32768
PARAMETER num_ctx 40960
# ---- Sampling (values picked for non-thinking mode) -------------------------
# NOTE(review): the metadata header of this file also advertises the
# "thinking" capability; the upstream model card is understood to list
# different temperature/top_p values for thinking mode - confirm which mode
# this file is meant to target.
PARAMETER top_k 20
PARAMETER top_p 0.8
PARAMETER min_p 0.00
PARAMETER temperature 0.7
# ---- Repetition control -----------------------------------------------------
PARAMETER presence_penalty 1.5
PARAMETER repeat_penalty 1.0
# ---- Stop sequences ---------------------------------------------------------
# Generation halts on either ChatML turn delimiter.
PARAMETER stop "<|im_end|>"
PARAMETER stop "<|im_start|>"
# Chat template for Qwen3 (ChatML framing), driven by the full message list.
#
# The metadata header of this file declares the "tools" and "thinking"
# capabilities, so the template has to render everything those features need:
#   * tool definitions (.Tools) are listed in the system turn inside
#     <tools></tools>, followed by the <tool_call> calling convention;
#   * earlier assistant tool calls are replayed inside <tool_call></tool_call>
#     and tool results are fed back as a user turn wrapped in
#     <tool_response></tool_response>;
#   * when the caller sets the think option, the last user turn gets the
#     " /think" or " /no_think" soft switch, and with thinking disabled the
#     assistant turn is pre-filled with an empty <think></think> block;
#   * stored assistant reasoning (.Thinking) is replayed inside <think></think>
#     only for turns after the last user message.
# A plain system + user exchange renders exactly as the previous
# single-prompt template did: system turn, user turn, open assistant turn.
#
# NOTE(review): $.IsThinkSet / $.Think / .Thinking require an Ollama release
# with thinking support - confirm the minimum version used with this repo.
# Do not put "#" comments inside the TEMPLATE string; they would be rendered
# into the prompt as literal text.
TEMPLATE """{{- $lastUserIdx := -1 -}}
{{- range $idx, $msg := .Messages -}}
{{- if eq $msg.Role "user" }}{{ $lastUserIdx = $idx }}{{ end -}}
{{- end -}}
{{- if or .System .Tools }}<|im_start|>system
{{- if .System }}
{{ .System }}
{{- end }}
{{- if .Tools }}

# Tools

You may call one or more functions to assist with the user query.

You are provided with function signatures within <tools></tools> XML tags:
<tools>
{{- range .Tools }}
{"type": "function", "function": {{ .Function }}}
{{- end }}
</tools>

For each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:
<tool_call>
{"name": <function-name>, "arguments": <args-json-object>}
</tool_call>
{{- end }}<|im_end|>
{{ end }}
{{- range $i, $_ := .Messages }}
{{- $last := eq (len (slice $.Messages $i)) 1 -}}
{{- if eq .Role "user" }}<|im_start|>user
{{ .Content }}
{{- if and $.IsThinkSet (eq $i $lastUserIdx) }}
{{- if $.Think }} /think{{ else }} /no_think{{ end }}
{{- end }}<|im_end|>
{{ else if eq .Role "assistant" }}<|im_start|>assistant
{{ if and $.IsThinkSet .Thinking (or $last (gt $i $lastUserIdx)) -}}
<think>{{ .Thinking }}</think>
{{ end -}}
{{ if .Content }}{{ .Content }}
{{- else if .ToolCalls }}<tool_call>
{{ range .ToolCalls }}{"name": "{{ .Function.Name }}", "arguments": {{ .Function.Arguments }}}
{{ end }}</tool_call>
{{- end }}{{ if not $last }}<|im_end|>
{{ end }}
{{- else if eq .Role "tool" }}<|im_start|>user
<tool_response>
{{ .Content }}
</tool_response><|im_end|>
{{ end }}
{{- if and (ne .Role "assistant") $last }}<|im_start|>assistant
{{ if and $.IsThinkSet (not $.Think) -}}
<think>

</think>

{{ end -}}
{{ end }}
{{- end }}"""
# Default system prompt; used when the request does not supply its own.
SYSTEM """You are Qwen, created by Alibaba Cloud. You are a helpful assistant."""