mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2026-06-27 23:50:20 -05:00
server: fix router args not being forwarded to child instances (#24760)
This commit is contained in:
parent
24bba7b98e
commit
968c43891a
@@ -351,6 +351,12 @@ void server_models::load_models() {
|
||||
source_map[name] = SERVER_MODEL_SOURCE_PRESET;
|
||||
}
|
||||
|
||||
// overlay router's own CLI args on top of every model preset so that
|
||||
// e.g. `llama-server --temp 0` is honoured by all child processes
|
||||
for (auto & [name, preset] : final_presets) {
|
||||
preset.merge(base_preset);
|
||||
}
|
||||
|
||||
auto get_source = [&](const std::string & name) {
|
||||
return source_map.count(name) ? source_map.at(name) : SERVER_MODEL_SOURCE_PRESET;
|
||||
};
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user