qwen modelfiles

This commit is contained in:
2026-01-18 22:21:00 +01:00
parent c40874d7f0
commit 197e3b9037
6 changed files with 180 additions and 0 deletions

View File

@@ -0,0 +1,30 @@
# ollama-utils-metadata
# hf_upstream: https://huggingface.co/Qwen/Qwen3-14B-GGUF/blob/main/qwen3-14b-q5_k_m.gguf
# capabilities: general
# Base weights: the GGUF file is resolved relative to this Modelfile's directory.
FROM ./qwen3-14b-q5_k_m.gguf
# Context and output parameters
# num_ctx is the context window in tokens; num_predict caps the tokens generated
# per response. With these values a maximum-length reply leaves
# 40960 - 32768 = 8192 tokens of context for the prompt and history.
PARAMETER num_ctx 40960
PARAMETER num_predict 32768
# Sampling parameters (non-thinking mode)
# NOTE(review): these values appear to follow the Qwen3 model card's suggested
# non-thinking settings (temperature 0.7, top_p 0.8, top_k 20, min_p 0) - confirm
# against the upstream card if the model is swapped.
PARAMETER temperature 0.7
PARAMETER top_p 0.8
PARAMETER top_k 20
PARAMETER min_p 0.00
# repeat_penalty 1.0 is neutral (no repeat penalty applied); repetition is
# discouraged through presence_penalty instead.
# NOTE(review): verify that the Ollama version in use honours presence_penalty
# when set from a Modelfile.
PARAMETER repeat_penalty 1.0
PARAMETER presence_penalty 1.5
# Stop tokens
# Generation halts when either ChatML turn delimiter is produced.
PARAMETER stop "<|im_start|>"
PARAMETER stop "<|im_end|>"
# Template for Qwen3 chat format (ChatML turns delimited by <|im_start|> / <|im_end|>).
# Ollama renders this template once per conversation turn when it does not
# reference .Messages, so every turn must be self-contained:
#   - the user turn is emitted only when .Prompt is non-empty, and
#   - the assistant turn is closed explicitly with <|im_end|> after .Response,
#     so earlier replies in a multi-turn chat are terminated before the next
#     <|im_start|>user. For the turn being generated, Ollama stops rendering at
#     .Response, so the trailing <|im_end|> is not fed to the model.
# NOTE(review): the sampling parameters in this file are labelled "non-thinking
# mode", but this template does not itself disable Qwen3 thinking (no /no_think
# directive or empty <think></think> prefill) - confirm which mode is intended.
TEMPLATE """{{ if .System }}<|im_start|>system
{{ .System }}<|im_end|>
{{ end }}{{ if .Prompt }}<|im_start|>user
{{ .Prompt }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ .Response }}<|im_end|>
"""
# Default system prompt; used when the request does not supply its own.
SYSTEM """You are Qwen, created by Alibaba Cloud. You are a helpful assistant."""