We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2016bf2, commit 96fbe00 (Copy full SHA for 96fbe00)
1 file changed
src/llama-model.cpp
@@ -1636,7 +1636,8 @@ const float * llama_model::tensor_split() const {
1636
}
1637
1638
uint32_t llama_model::n_gpu_layers() const {
1639
- return params.n_gpu_layers >= 0 ? params.n_gpu_layers : hparams.n_layer() + 1;
+ // note: plus 1 for the "output" layer
1640
+ return params.n_gpu_layers >= 0 ? params.n_gpu_layers : hparams.n_layer_all + 1;
1641
1642
1643
llama_split_mode llama_model::split_mode() const {
0 commit comments