mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2026-06-27 23:50:20 -05:00
model : fix llama_model::n_gpu_layers() (#24188)
This commit is contained in:
parent
2016bf2b3b
commit
96fbe00393
@@ -1636,7 +1636,8 @@ const float * llama_model::tensor_split() const {
|
||||
}
|
||||
|
||||
uint32_t llama_model::n_gpu_layers() const {
|
||||
-    return params.n_gpu_layers >= 0 ? params.n_gpu_layers : hparams.n_layer() + 1;
|
||||
+    // note: plus 1 for the "output" layer
|
||||
+    return params.n_gpu_layers >= 0 ? params.n_gpu_layers : hparams.n_layer_all + 1;
|
||||
}
|
||||
|
||||
llama_split_mode llama_model::split_mode() const {
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user