We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6dc9d41, commit a259eff (Copy full SHA for a259eff)
examples/performance/compute_context_length/gemma3.py
@@ -38,7 +38,7 @@
38
model_id,
39
config=config,
40
attn_implementation="eager",
41
- kv_offload=False,
+ kv_offload=True,
42
qaic_config={
43
"ccl_enabled":True,
44
},
examples/performance/compute_context_length/molmo.py
@@ -33,7 +33,7 @@
33
34
qeff_model = QEFFAutoModelForCausalLM.from_pretrained(
35
36
37
trust_remote_code=True,
0 commit comments