From f5591709609312006aa40a9f33f13fbb0393052e4d3b8938cc93e8738c2ad98e Mon Sep 17 00:00:00 2001 From: mstoeck3 Date: Mon, 19 Jan 2026 09:47:55 +0100 Subject: [PATCH] fix qwen3 modelfiles to include quantization info --- modelfile-repo/qwen3-14b-q4_k_m.Modelfile | 1 + modelfile-repo/qwen3-14b-q5_k_m.Modelfile | 1 + modelfile-repo/qwen3-14b-q8_0.Modelfile | 1 + modelfile-repo/qwen3-8b-q4_k_m.Modelfile | 1 + modelfile-repo/qwen3-8b-q5_k_m.Modelfile | 1 + modelfile-repo/qwen3-8b-q8_0.Modelfile | 1 + 6 files changed, 6 insertions(+) diff --git a/modelfile-repo/qwen3-14b-q4_k_m.Modelfile b/modelfile-repo/qwen3-14b-q4_k_m.Modelfile index 6ac491d..8bafa1e 100644 --- a/modelfile-repo/qwen3-14b-q4_k_m.Modelfile +++ b/modelfile-repo/qwen3-14b-q4_k_m.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-14B-GGUF +# quantization: q4_k_m # capabilities: tools,thinking FROM ./qwen3-14b-q4_k_m.gguf diff --git a/modelfile-repo/qwen3-14b-q5_k_m.Modelfile b/modelfile-repo/qwen3-14b-q5_k_m.Modelfile index d7c2c93..0122ae4 100644 --- a/modelfile-repo/qwen3-14b-q5_k_m.Modelfile +++ b/modelfile-repo/qwen3-14b-q5_k_m.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-14B-GGUF +# quantization: q5_k_m # capabilities: tools,thinking FROM ./qwen3-14b-q5_k_m.gguf diff --git a/modelfile-repo/qwen3-14b-q8_0.Modelfile b/modelfile-repo/qwen3-14b-q8_0.Modelfile index 538c06d..f8e3ccf 100644 --- a/modelfile-repo/qwen3-14b-q8_0.Modelfile +++ b/modelfile-repo/qwen3-14b-q8_0.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-14B-GGUF +# quantization: q8_0 # capabilities: tools,thinking FROM ./qwen3-14b-q8_0.gguf diff --git a/modelfile-repo/qwen3-8b-q4_k_m.Modelfile b/modelfile-repo/qwen3-8b-q4_k_m.Modelfile index 30ea258..a2837aa 100644 --- a/modelfile-repo/qwen3-8b-q4_k_m.Modelfile +++ b/modelfile-repo/qwen3-8b-q4_k_m.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-8B-GGUF +# quantization: q4_k_m # capabilities: tools,thinking FROM ./qwen3-8b-q4_k_m.gguf diff --git a/modelfile-repo/qwen3-8b-q5_k_m.Modelfile b/modelfile-repo/qwen3-8b-q5_k_m.Modelfile index e51b1cb..12fb4de 100644 --- a/modelfile-repo/qwen3-8b-q5_k_m.Modelfile +++ b/modelfile-repo/qwen3-8b-q5_k_m.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-8B-GGUF +# quantization: q5_k_m # capabilities: tools,thinking FROM ./qwen3-8b-q5_k_m.gguf diff --git a/modelfile-repo/qwen3-8b-q8_0.Modelfile b/modelfile-repo/qwen3-8b-q8_0.Modelfile index 829ad76..0f8dfca 100644 --- a/modelfile-repo/qwen3-8b-q8_0.Modelfile +++ b/modelfile-repo/qwen3-8b-q8_0.Modelfile @@ -1,5 +1,6 @@ # ollama-utils-metadata # hf_upstream: https://huggingface.co/Qwen/Qwen3-8B-GGUF +# quantization: q8_0 # capabilities: tools,thinking FROM ./qwen3-8b-q8_0.gguf