We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent eb4e399, commit 8ba4d39 (Copy full SHA for 8ba4d39)
src/llama-context.cpp
@@ -1389,6 +1389,13 @@ void llama_context::output_reorder() {
1389
uint32_t llama_context::graph_max_nodes() const {
1390
if (model.arch == LLM_ARCH_QWEN3NEXT) {
1391
return std::max<uint32_t>(8192u, 32u*model.n_tensors());
1392
+ } else if (
1393
+ model.arch == LLM_ARCH_GRANITE_HYBRID ||
1394
+ model.arch == LLM_ARCH_MAMBA2 ||
1395
+ model.arch == LLM_ARCH_FALCON_H1 ||
1396
+ model.arch == LLM_ARCH_NEMOTRON_H
1397
+ ) {
1398
+ return std::max<uint32_t>(1024u, 16u*model.n_tensors());
1399
}
1400
return std::max<uint32_t>(1024u, 8u*model.n_tensors());
1401
0 commit comments