fix(llama-swap): allow qwen thinking by default
This commit is contained in:
@@ -189,7 +189,6 @@ in
|
|||||||
--language-model-only
|
--language-model-only
|
||||||
--trust-remote-code
|
--trust-remote-code
|
||||||
--reasoning-parser qwen3
|
--reasoning-parser qwen3
|
||||||
--default-chat-template-kwargs '{"enable_thinking": false}'
|
|
||||||
--enable-auto-tool-choice
|
--enable-auto-tool-choice
|
||||||
--tool-call-parser qwen3_coder
|
--tool-call-parser qwen3_coder
|
||||||
--enable-prefix-caching
|
--enable-prefix-caching
|
||||||
@@ -330,7 +329,6 @@ in
|
|||||||
--kv-cache-dtype turboquant_3bit_nc
|
--kv-cache-dtype turboquant_3bit_nc
|
||||||
--trust-remote-code
|
--trust-remote-code
|
||||||
--reasoning-parser qwen3
|
--reasoning-parser qwen3
|
||||||
--default-chat-template-kwargs '{"enable_thinking": false}'
|
|
||||||
--enable-auto-tool-choice
|
--enable-auto-tool-choice
|
||||||
--tool-call-parser qwen3_coder
|
--tool-call-parser qwen3_coder
|
||||||
--enable-prefix-caching
|
--enable-prefix-caching
|
||||||
@@ -467,7 +465,6 @@ in
|
|||||||
--language-model-only
|
--language-model-only
|
||||||
--trust-remote-code
|
--trust-remote-code
|
||||||
--reasoning-parser qwen3
|
--reasoning-parser qwen3
|
||||||
--default-chat-template-kwargs '{"enable_thinking": false}'
|
|
||||||
--enable-auto-tool-choice
|
--enable-auto-tool-choice
|
||||||
--tool-call-parser qwen3_coder
|
--tool-call-parser qwen3_coder
|
||||||
--enable-prefix-caching
|
--enable-prefix-caching
|
||||||
|
|||||||
Reference in New Issue
Block a user