We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 59db9a3 · commit 0842b9b · Copy full SHA for 0842b9b
1 file changed
src/llama-model.cpp
@@ -7348,7 +7348,7 @@ bool llama_model::load_tensors(llama_model_loader & ml) {
7348
// ("rope_freqs.weight") and ggml uses only the first (n_rot_l/2) entries per layer.
7349
uint32_t n_rot_max = 0;
7350
for (int i = 0; i < n_layer; ++i) {
7351
- n_rot_max = std::max(n_rot_max, hparams.n_rot());
+ n_rot_max = std::max(n_rot_max, hparams.n_rot(i));
7352
}
7353
if (n_rot_max == 0) {
7354
n_rot_max = n_rot;
0 commit comments