From 79884e8a77c421be356ce3cb97b71e2a586538e3 Mon Sep 17 00:00:00 2001 From: Evan Reichard Date: Wed, 20 May 2026 00:11:08 -0400 Subject: [PATCH] fix(llama-swap): reduce qwen3.6 dual context --- modules/nixos/services/llama-swap/config.nix | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/modules/nixos/services/llama-swap/config.nix b/modules/nixos/services/llama-swap/config.nix index 7aa197a..269c8d9 100644 --- a/modules/nixos/services/llama-swap/config.nix +++ b/modules/nixos/services/llama-swap/config.nix @@ -650,7 +650,7 @@ in # https://huggingface.co/unsloth/Qwen3.6-27B-GGUF-MTP/tree/main "qwen3.6-27b-dual" = { name = "Qwen3.6 27B (Dual GPU, UD-Q6)"; - macros.ctx = "196608"; + macros.ctx = "180000"; cmd = '' ${llama-cpp}/bin/llama-server \ --port ''${PORT} \