From ceff33273d857d57cb427e0e82028dda330c70cd Mon Sep 17 00:00:00 2001
From: Evan Reichard
Date: Thu, 16 Apr 2026 16:20:00 -0400
Subject: [PATCH] feat(llama-swap): add Qwen3.6-35B-A3B model configuration

---
 modules/nixos/services/llama-swap/config.nix | 26 ++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/modules/nixos/services/llama-swap/config.nix b/modules/nixos/services/llama-swap/config.nix
index d1c8162..76e8458 100644
--- a/modules/nixos/services/llama-swap/config.nix
+++ b/modules/nixos/services/llama-swap/config.nix
@@ -124,6 +124,32 @@ in
       };
     };
 
+    # https://huggingface.co/unsloth/Qwen3.6-35B-A3B-GGUF/tree/main
+    "qwen3.6-35b-thinking" = {
+      name = "Qwen3.6 (35B) - Thinking";
+      macros.ctx = "262144"; # 256 * 1024; referenced as ${ctx} by the -c flag in cmd below
+      cmd = ''
+        ${llama-cpp}/bin/llama-server \
+          --port ''${PORT} \
+          -m /mnt/ssd/Models/Qwen3.6/Qwen3.6-35B-A3B-UD-IQ4_XS.gguf \
+          -c ''${ctx} \
+          --temp 0.6 \
+          --top-p 0.95 \
+          --top-k 20 \
+          --min-p 0.0 \
+          --presence-penalty 0.0 \
+          --repeat-penalty 1.0 \
+          -dev CUDA0 \
+          -fit off
+      ''; # only ${llama-cpp} is interpolated by Nix; the ''-escaped ${PORT}/${ctx} stay literal in the command string
+      metadata = { # NOTE(review): consumer of these type tags is not visible in this patch - confirm
+        type = [
+          "text-generation"
+          "coding"
+        ];
+      };
+    };
+
     # https://huggingface.co/bartowski/Qwen_Qwen3.5-27B-GGUF/tree/main
     "qwen3.5-27b-thinking" = {
       name = "Qwen3.5 (27B) - Thinking";