mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2026-06-27 23:50:20 -05:00
server : hint preserve_thinking when supported by chat template
Print a hint suggesting the preserve_thinking chat-template kwarg when the chat template supports it.
ref: https://docs.z.ai/guides/capabilities/thinking-mode#preserved-thinking
Assisted-by: pi:llama.cpp/Qwen3.6-27B
This commit is contained in:
parent
eae7149824
commit
3deb4d1711
@@ -1521,7 +1521,7 @@ private:
|
||||
if (params_base.use_jinja && common_chat_templates_support_preserve_thinking(chat_templates.get())) {
|
||||
auto it = params_base.default_template_kwargs.find("preserve_thinking");
|
||||
if (it == params_base.default_template_kwargs.end()) {
|
||||
SRV_WRN("%s\n", "chat template supports 'preserve_thinking' - consider using --chat-template-kwargs \"{\\\"preserve_thinking\\\": true}\"");
|
||||
SRV_WRN("%s\n", "chat template supports 'preserve_thinking' - consider using --chat-template-kwargs \"{\\\"preserve_thinking\\\": true}\" (ref: https://docs.z.ai/guides/capabilities/thinking-mode#preserved-thinking)");
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user