From a01f9e34eeec8675e2f5622d8f9b2974d391ab98 Mon Sep 17 00:00:00 2001 From: Evan Reichard Date: Tue, 12 May 2026 09:27:42 -0400 Subject: [PATCH] chore: tweak ctx --- modules/nixos/services/llama-swap/config.nix | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/modules/nixos/services/llama-swap/config.nix b/modules/nixos/services/llama-swap/config.nix index 0ab9713..cb38ea2 100644 --- a/modules/nixos/services/llama-swap/config.nix +++ b/modules/nixos/services/llama-swap/config.nix @@ -60,7 +60,7 @@ in # https://huggingface.co/unsloth/Qwen3.6-27B-GGUF-MTP/tree/main "qwen3.6-27b-udq4-thinking" = { name = "Qwen3.6 (27B) - Thinking (UD-Q4)"; - macros.ctx = "150000"; + macros.ctx = "140000"; cmd = '' ${llama-cpp}/bin/llama-server \ --port ''${PORT} \ @@ -609,7 +609,7 @@ in # https://huggingface.co/unsloth/Qwen3.6-27B-GGUF-MTP/tree/main "qwen3.6-27b-udq6-thinking" = { name = "Qwen3.6 (27B) - Thinking (UD-Q6)"; - macros.ctx = "225000"; + macros.ctx = "196608"; cmd = '' ${llama-cpp}/bin/llama-server \ --port ''${PORT} \