-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathindex.html
More file actions
762 lines (711 loc) · 68.6 KB
/
index.html
File metadata and controls
762 lines (711 loc) · 68.6 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>VRAM vs Context — ollama-0.18.0 / B6000</title>
<style>
  /* ---------- Reset ---------- */
  /* Border-box sizing everywhere and no default margins/padding. */
  *,
  *::before,
  *::after {
    margin: 0;
    padding: 0;
    box-sizing: border-box;
  }

  /* ---------- Page shell (dark theme) ---------- */
  body {
    min-height: 100vh;
    padding: 2rem 1.5rem;
    color: #e0e0e0;
    background: #0f0f0f;
    font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
  }

  /* Centered content column. */
  .container {
    max-width: 1100px;
    margin: 0 auto;
  }

  /* ---------- Heading and subtitle ---------- */
  h1 {
    margin-bottom: 0.25rem;
    color: #aaa;
    font-size: 1.1rem;
    font-weight: 500;
  }

  .subtitle {
    margin-bottom: 1.5rem;
    color: #666;
    font-size: 0.8rem;
  }

  /* ---------- Slider row ---------- */
  .controls {
    display: flex;
    flex-wrap: wrap;
    align-items: center;
    gap: 12px;
    margin-bottom: 1rem;
  }

  .controls label {
    color: #888;
    font-size: 12px;
  }

  .controls input[type="range"] {
    width: 180px;
    accent-color: #4a7abf;
  }

  /* Read-out next to the slider; min-width reserves horizontal space for it. */
  #xmax-label {
    min-width: 48px;
    color: #ddd;
    font-size: 12px;
    font-weight: 500;
  }

  /* ---------- Legend layout ---------- */
  /* Wrapping row used by the element with class "legend". */
  .legend {
    display: flex;
    flex-wrap: wrap;
    gap: 7px;
    margin-bottom: 1.25rem;
  }

  /* Wrapping row of control buttons inside a legend section. */
  .legend-ctrl {
    display: flex;
    flex-wrap: wrap;
    gap: 6px;
    margin-bottom: 0.5rem;
  }

  .legend-section {
    margin-bottom: 0.75rem;
  }

  /* Small upper-cased caption above each group of controls. */
  .legend-section-title {
    margin-bottom: 6px;
    color: #888;
    font-size: 11px;
    letter-spacing: 0.5px;
    text-transform: uppercase;
  }

  /* ---------- Control buttons ---------- */
  button.ctrl-btn {
    padding: 3px 12px;
    border: 0.5px solid #555;
    border-radius: 4px;
    color: #ccc;
    background: #1e1e1e;
    font-size: 11px;
    cursor: pointer;
    transition: background 0.15s;
  }

  button.ctrl-btn:hover {
    background: #2a2a2a;
  }

  /* Same specificity as the :hover rule and declared after it, so an
     active button keeps this background while hovered. */
  button.ctrl-btn.active {
    color: #fff;
    background: #4a7abf;
    border-color: #4a7abf;
  }

  /* ---------- Legend buttons ---------- */
  /* NOTE(review): no .leg-btn, .swatch or .version-tag element exists in the
     static markup; presumably the page script creates them. Confirm there. */
  button.leg-btn {
    display: inline-flex;
    align-items: center;
    gap: 5px;
    padding: 3px 10px;
    border-radius: 4px;
    color: #ddd;
    background: transparent;
    font-size: 11px;
    cursor: pointer;
    transition: opacity 0.15s;
  }

  /* Fixed-size square; flex-shrink: 0 keeps it from being squeezed. */
  button.leg-btn .swatch {
    flex-shrink: 0;
    width: 10px;
    height: 10px;
    border-radius: 2px;
  }

  button.leg-btn .version-tag {
    margin-left: 2px;
    padding: 1px 4px;
    border-radius: 2px;
    color: #888;
    background: #2a2a2a;
    font-size: 9px;
  }

  /* ---------- Chart area ---------- */
  /* Positioned wrapper with a fixed height around the canvas. */
  .chart-wrap {
    position: relative;
    width: 100%;
    height: 520px;
  }

  /* Narrow viewports: shorter chart, tighter page padding. */
  @media (max-width: 600px) {
    .chart-wrap {
      height: 380px;
    }

    body {
      padding: 1rem;
    }
  }
</style>
</head>
<body>
<div class="container">
  <h1>VRAM vs Context</h1>
  <p class="subtitle">ollama-0.18.0 · B6000</p>

  <!-- Slider row. The slider runs from 1 to 100 and starts at 100; the empty
       #xmax-label span has no static text.
       NOTE(review): presumably the page script maps the slider value to a
       maximum context and writes it into #xmax-label; confirm in the script. -->
  <div class="controls">
    <label for="xmax-slider">Max context:</label>
    <input type="range" id="xmax-slider" min="1" max="100" step="1" value="100">
    <span id="xmax-label"></span>
  </div>

  <!-- Version filter. Labelled as a group so its "All" button can be told
       apart from the "All" button in the Models group by assistive technology. -->
  <div class="legend-section">
    <div class="legend-section-title" id="version-ctrl-title">Version</div>
    <div class="legend-ctrl" id="version-ctrl" role="group" aria-labelledby="version-ctrl-title">
      <button type="button" class="ctrl-btn active" data-version="all">All</button>
    </div>
  </div>

  <!-- Bulk show/hide controls for the model legend. -->
  <div class="legend-section">
    <div class="legend-section-title" id="models-ctrl-title">Models</div>
    <div class="legend-ctrl" role="group" aria-labelledby="models-ctrl-title">
      <button type="button" class="ctrl-btn" id="btn-all">All</button>
      <button type="button" class="ctrl-btn" id="btn-none">None</button>
    </div>
  </div>

  <!-- Empty in the static markup.
       NOTE(review): presumably filled with legend buttons by the page script. -->
  <div class="legend" id="legend"></div>

  <!-- Chart surface. role="img" plus aria-label gives the canvas an accessible
       name; the inner paragraph is fallback content shown only when the canvas
       cannot be rendered. -->
  <div class="chart-wrap">
    <canvas id="myChart" role="img" aria-label="Chart of VRAM usage versus context length for the selected models">
      <p>Chart of VRAM usage versus context length for the selected models.</p>
    </canvas>
  </div>
</div>
<!-- Chart.js 4.4.1 (UMD build) loaded from the cdnjs CDN. The tag has no
     async/defer, so it is fetched and executed before the inline script that
     follows it.
     NOTE(review): presumably the inline script relies on the global this file
     defines; confirm before adding defer/async.
     NOTE(review): no integrity (SRI) / crossorigin attributes are set on this
     third-party script; consider adding the hash published by cdnjs. -->
<script src="https://cdnjs.cloudflare.com/ajax/libs/Chart.js/4.4.1/chart.umd.js"></script>
<script>
const raw = [
{ model: "apertus:8b-instruct-2509-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 8327140693, vram: 8327140693, nvram: 7964983296 },
{ model: "apertus:8b-instruct-2509-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 11906280106, vram: 11906280106, nvram: 10112466944 },
{ model: "apertus:8b-instruct-2509-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 15485419520, vram: 15485419520, nvram: 12259950592 },
{ model: "apertus:8b-instruct-2509-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 19064558933, vram: 19064558933, nvram: 14407434240 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 7905732608, vram: 7905732608, nvram: 7879000064 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 11160512512, vram: 11160512512, nvram: 9976152064 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 14415292416, vram: 14415292416, nvram: 12220104704 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 17670072320, vram: 17670072320, nvram: 14367588352 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 20924852224, vram: 20924852224, nvram: 16433283072 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 24179632128, vram: 24179632128, nvram: 18631098368 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 27434412032, vram: 27434412032, nvram: 20828913664 },
{ model: "cogito:8b-v1-preview-llama-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 30689191936, vram: 30689191936, nvram: 23026728960 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 13162129408, vram: 13162129408, nvram: 12891193344 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 17759086592, vram: 17759086592, nvram: 16101933056 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 22356043776, vram: 22356043776, nvram: 19417530368 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 26953000960, vram: 26953000960, nvram: 22638755840 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 31549958144, vram: 31549958144, nvram: 25765609472 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 36146915328, vram: 36146915328, nvram: 29009903616 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 40743872512, vram: 40743872512, nvram: 32281460736 },
{ model: "deepcoder:14b-preview-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 45340829696, vram: 45340829696, nvram: 35553017856 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 6297843712, vram: 6297843712, nvram: 6471811072 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 8210446336, vram: 8210446336, nvram: 7446986752 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 10123048960, vram: 10123048960, nvram: 8300527616 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 12035651584, vram: 12035651584, nvram: 9363783680 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 13948254208, vram: 13948254208, nvram: 10303307776 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 15860856832, vram: 15860856832, nvram: 11133779968 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 17773459456, vram: 17773459456, nvram: 12123635712 },
{ model: "deepseek-r1:7b-qwen-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 19686062080, vram: 19686062080, nvram: 13113491456 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 7880708224, vram: 7880708224, nvram: 8243904512 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 10321793152, vram: 10321793152, nvram: 10682892288 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 12762878080, vram: 12762878080, nvram: 13123977216 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 15229128832, vram: 15229128832, nvram: 15590227968 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 17695379584, vram: 17695379584, nvram: 18056478720 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 20161630336, vram: 20161630336, nvram: 20522729472 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 22627881088, vram: 22627881088, nvram: 22988980224 },
{ model: "deepseek-r1:8b-0528-qwen3-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 25094131840, vram: 25094131840, nvram: 25455230976 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 49538385920, vram: 49538385920, nvram: 48362422272 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 57088133120, vram: 57088133120, nvram: 53831794688 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 64637880320, vram: 64637880320, nvram: 59234058240 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 72187627520, vram: 72187627520, nvram: 64516784128 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 79737374720, vram: 79737374720, nvram: 69935824896 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 87287121920, vram: 87287121920, nvram: 75398905856 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 94836869120, vram: 94836869120, nvram: 80767614976 },
{ model: "deepseek-r1:70b-llama-distill-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 119902031872, vram: 119902031872, nvram: 88820678656 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 17782134784, vram: 17782134784, nvram: 17704157184 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 21573785600, vram: 21573785600, nvram: 20388511744 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 25365436416, vram: 25365436416, nvram: 23119003648 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 29157087232, vram: 29157087232, nvram: 25786580992 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 32948738048, vram: 32948738048, nvram: 28521267200 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 36740388864, vram: 36740388864, nvram: 31188844544 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 40532039680, vram: 40532039680, nvram: 33923530752 },
{ model: "devstral:24b-small-2505-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 44323690496, vram: 44323690496, nvram: 36658216960 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 18761581952, vram: 18761581952, nvram: 19096666112 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 21445936512, vram: 21445936512, nvram: 21778923520 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 24130291072, vram: 24130291072, nvram: 24463278080 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 26814645632, vram: 26814645632, nvram: 27147632640 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 29499000192, vram: 29499000192, nvram: 29831987200 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 32183354752, vram: 32183354752, nvram: 32516341760 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 34867709312, vram: 34867709312, nvram: 35200696320 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 37552063872, vram: 37552063872, nvram: 37885050880 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 40236418432, vram: 40236418432, nvram: 40569405440 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 42920772992, vram: 42920772992, nvram: 43253760000 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 45605127552, vram: 45605127552, nvram: 45938114560 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 48289482112, vram: 48289482112, nvram: 48622469120 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 50973836672, vram: 50973836672, nvram: 51306823680 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 53658191232, vram: 53658191232, nvram: 53991178240 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 56365062272, vram: 56365062272, nvram: 56696504320 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 59099748480, vram: 59099748480, nvram: 59431190528 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 278528, ram: 61834434688, vram: 61834434688, nvram: 62165876736 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 294912, ram: 64569120896, vram: 64569120896, nvram: 64900562944 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 311296, ram: 67303807104, vram: 67303807104, nvram: 67635249152 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 327680, ram: 70038493312, vram: 70038493312, nvram: 70369935360 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 344064, ram: 72773179520, vram: 72773179520, nvram: 73104621568 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 360448, ram: 75507865728, vram: 75507865728, nvram: 75839307776 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 376832, ram: 78242551936, vram: 78242551936, nvram: 78573993984 },
{ model: "devstral-small-2:24b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 393216, ram: 80977238144, vram: 80977238144, nvram: 81308680192 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 81199552640, vram: 81199552640, nvram: 80994107392 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 87147075712, vram: 87147075712, nvram: 86939533312 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 93102987392, vram: 93102987392, nvram: 92891250688 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 99000178816, vram: 99000178816, nvram: 98788442112 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 105310515328, vram: 105310515328, nvram: 105792929792 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 111283204224, vram: 111283204224, nvram: 111767715840 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 117255893120, vram: 117255893120, nvram: 117738307584 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 123228582016, vram: 123228582016, nvram: 123710996480 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 129201270912, vram: 129201270912, nvram: 129683685376 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 135173959808, vram: 135173959808, nvram: 135656374272 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 141146648704, vram: 141146648704, nvram: 141629063168 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 147119337600, vram: 147119337600, nvram: 147599654912 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 153092026496, vram: 153092026496, nvram: 153572343808 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 159064715392, vram: 159064715392, nvram: 159545032704 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 165037404288, vram: 165037404288, nvram: 165517721600 },
{ model: "devstral-2:123b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 171010093184, vram: 171010093184, nvram: 171492507648 },
{ model: "exaone-deep:7.8b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 8109659477, vram: 8109659477, nvram: 7740588032 },
{ model: "exaone-deep:7.8b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 11688798890, vram: 11688798890, nvram: 9835642880 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 16384, ram: 8140180864, vram: 8140180864, nvram: 8514437120 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 32768, ram: 8677051776, vram: 8677051776, nvram: 9055502336 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 49152, ram: 9213922688, vram: 9213922688, nvram: 9590276096 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 65536, ram: 9750793600, vram: 9750793600, nvram: 10125049856 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 81920, ram: 10287664512, vram: 10287664512, nvram: 10666115072 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 98304, ram: 10824535424, vram: 10824535424, nvram: 11198791680 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 114688, ram: 11361406336, vram: 11361406336, nvram: 11737759744 },
{ model: "gemma4:e2b", version: "0.20.2", quant: "Q4_K_M", context: 131072, ram: 11898277248, vram: 11898277248, nvram: 12272533504 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 16384, ram: 11114610688, vram: 11114610688, nvram: 11284774912 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 32768, ram: 11819253760, vram: 11819253760, nvram: 11995709440 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 49152, ram: 12523896832, vram: 12523896832, nvram: 12702449664 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 65536, ram: 13228539904, vram: 13228539904, nvram: 13404995584 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 81920, ram: 13933182976, vram: 13933182976, nvram: 14111735808 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 98304, ram: 14637826048, vram: 14637826048, nvram: 14814281728 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 114688, ram: 15342469120, vram: 15342469120, nvram: 15521021952 },
{ model: "gemma4:e4b", version: "0.20.2", quant: "Q4_K_M", context: 131072, ram: 16047112192, vram: 16047112192, nvram: 16223567872 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 16384, ram: 20779285888, vram: 20779285888, nvram: 20795359232 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 32768, ram: 21953691008, vram: 21953691008, nvram: 21976055808 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 49152, ram: 23128096128, vram: 23128096128, nvram: 23152558080 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 65536, ram: 24302501248, vram: 24302501248, nvram: 24326963200 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 81920, ram: 25476906368, vram: 25476906368, nvram: 25499271168 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 98304, ram: 26651311488, vram: 26651311488, nvram: 26675773440 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 114688, ram: 27825716608, vram: 27825716608, nvram: 27848081408 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 131072, ram: 29000121728, vram: 29000121728, nvram: 29022486528 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 147456, ram: 30174526848, vram: 30174526848, nvram: 30198988800 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 163840, ram: 31348931968, vram: 31348931968, nvram: 31371296768 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 180224, ram: 32523337088, vram: 32523337088, nvram: 32545701888 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 196608, ram: 33697742208, vram: 33697742208, nvram: 33720107008 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 212992, ram: 34872147328, vram: 34872147328, nvram: 34896609280 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 229376, ram: 36046552448, vram: 36046552448, nvram: 36068917248 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 245760, ram: 37220957568, vram: 37220957568, nvram: 37243322368 },
{ model: "gemma4:26b", version: "0.20.2", quant: "Q4_K_M", context: 262144, ram: 38395362688, vram: 38395362688, nvram: 38415630336 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 16384, ram: 27915524736, vram: 27915524736, nvram: 27376222208 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 32768, ram: 30901869184, vram: 30901869184, nvram: 30368858112 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 49152, ram: 33888213632, vram: 33888213632, nvram: 33355202560 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 65536, ram: 36874558080, vram: 36874558080, nvram: 36341547008 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 81920, ram: 39860902528, vram: 39860902528, nvram: 39327891456 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 98304, ram: 42847246976, vram: 42847246976, nvram: 42314235904 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 114688, ram: 45833591424, vram: 45833591424, nvram: 45300580352 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 131072, ram: 48819935872, vram: 48819935872, nvram: 48286924800 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 147456, ram: 51806280320, vram: 51806280320, nvram: 51273269248 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 163840, ram: 54792624768, vram: 54792624768, nvram: 54259613696 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 180224, ram: 57778969216, vram: 57778969216, nvram: 57245958144 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 196608, ram: 60765313664, vram: 60765313664, nvram: 60230205440 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 212992, ram: 63751658112, vram: 63751658112, nvram: 63218647040 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 229376, ram: 66738002560, vram: 66738002560, nvram: 66204991488 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 245760, ram: 69724347008, vram: 69724347008, nvram: 69191335936 },
{ model: "gemma4:31b", version: "0.20.2", quant: "Q4_K_M", context: 262144, ram: 72710691456, vram: 72710691456, nvram: 72177680384 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 20989454208, vram: 20989454208, nvram: 21531459584 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 22698633088, vram: 22698633088, nvram: 23240638464 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 24458143616, vram: 24458143616, nvram: 24995954688 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 26184099712, vram: 26184099712, nvram: 26721910784 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 27910055808, vram: 27910055808, nvram: 28447866880 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 29636011904, vram: 29636011904, nvram: 30173822976 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 31361968000, vram: 31361968000, nvram: 31899779072 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 33087924096, vram: 33087924096, nvram: 33625735168 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 34813880192, vram: 34813880192, nvram: 35351691264 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 36539836288, vram: 36539836288, nvram: 37077647360 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 38265792384, vram: 38265792384, nvram: 38803603456 },
{ model: "glm-4.7-flash:q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 39991748480, vram: 39991748480, nvram: 40529559552 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 16384, ram: 14488221056, vram: 14488221056, nvram: 14082375680 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 32768, ram: 14920365440, vram: 14920365440, nvram: 14512291840 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 49152, ram: 15356573056, vram: 15356573056, nvram: 14948499456 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 65536, ram: 15799989632, vram: 15799989632, nvram: 15390998528 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 81920, ram: 16252974464, vram: 16252974464, nvram: 15843983360 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 98304, ram: 16705959296, vram: 16705959296, nvram: 16296968192 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 114688, ram: 17158944128, vram: 17158944128, nvram: 16749953024 },
{ model: "gpt-oss:20b", version: "0.18.0", quant: "MXFP4", context: 131072, ram: 17611928960, vram: 17611928960, nvram: 17202937856 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 16384, ram: 66322539392, vram: 66322539392, nvram: 65936556032 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 32768, ram: 66956010368, vram: 66956010368, nvram: 66567798784 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 49152, ram: 67593544576, vram: 67593544576, nvram: 67203235840 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 65536, ram: 68238287744, vram: 68238287744, nvram: 67847061504 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 81920, ram: 68892599168, vram: 68892599168, nvram: 68501372928 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 98304, ram: 69546910592, vram: 69546910592, nvram: 69155684352 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 114688, ram: 70201222016, vram: 70201222016, nvram: 69809995776 },
{ model: "gpt-oss:120b", version: "0.18.0", quant: "MXFP4", context: 131072, ram: 70855533440, vram: 70855533440, nvram: 70464307200 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 4556591786, vram: 4556591786, nvram: 4391436288 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 7017250133, vram: 7017250133, nvram: 5788139520 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 9477908480, vram: 9477908480, nvram: 7075790848 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 11938566826, vram: 11938566826, nvram: 8430551040 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 14399225173, vram: 14399225173, nvram: 9823059968 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 16859883520, vram: 16859883520, nvram: 11215568896 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 19320541866, vram: 19320541866, nvram: 12608077824 },
{ model: "granite4:3b", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 21781200213, vram: 21781200213, nvram: 14000586752 },
{ model: "lfm2:24b-q4_k_m", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 15046118016, vram: 15046118016, nvram: 15653142528 },
{ model: "lfm2:24b-q4_k_m", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 15415216768, vram: 15415216768, nvram: 16018046976 },
{ model: "magistral:24b-small-2506-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 17782134784, vram: 17782134784, nvram: 17704157184 },
{ model: "magistral:24b-small-2506-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 21573785600, vram: 21573785600, nvram: 20388511744 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 9201685888, vram: 9201685888, nvram: 9613344768 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 11483387264, vram: 11483387264, nvram: 11892948992 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 13765088640, vram: 13765088640, nvram: 14174650368 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 16046790016, vram: 16046790016, nvram: 16456351744 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 18328491392, vram: 18328491392, nvram: 18738053120 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 20610192768, vram: 20610192768, nvram: 21019754496 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 22891894144, vram: 22891894144, nvram: 23301455872 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 25173595520, vram: 25173595520, nvram: 25583157248 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 27455296896, vram: 27455296896, nvram: 27864858624 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 29736998272, vram: 29736998272, nvram: 30146560000 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 32018699648, vram: 32018699648, nvram: 32428261376 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 34300401024, vram: 34300401024, nvram: 34709962752 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 36582102400, vram: 36582102400, nvram: 36991664128 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 38863803776, vram: 38863803776, nvram: 39273365504 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 41170188416, vram: 41170188416, nvram: 41578135552 },
{ model: "ministral-3:8b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 43502221440, vram: 43502221440, nvram: 43910168576 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 12666733952, vram: 12666733952, nvram: 13002342400 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 15351088512, vram: 15351088512, nvram: 15684599808 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 18035443072, vram: 18035443072, nvram: 18366857216 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 20719797632, vram: 20719797632, nvram: 21051211776 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 23404152192, vram: 23404152192, nvram: 23735566336 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 26088506752, vram: 26088506752, nvram: 26419920896 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 28772861312, vram: 28772861312, nvram: 29104275456 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 31457215872, vram: 31457215872, nvram: 31788630016 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 34141570432, vram: 34141570432, nvram: 34472984576 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 36825924992, vram: 36825924992, nvram: 37157339136 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 39510279552, vram: 39510279552, nvram: 39841693696 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 42194634112, vram: 42194634112, nvram: 42526048256 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 44878988672, vram: 44878988672, nvram: 45210402816 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 47563343232, vram: 47563343232, nvram: 47894757376 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 50270214272, vram: 50270214272, nvram: 50600083456 },
{ model: "ministral-3:14b-instruct-2512-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 53004900480, vram: 53004900480, nvram: 53334769664 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 5468162176, vram: 5468162176, nvram: 6037700608 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 5770152064, vram: 5770152064, nvram: 6339690496 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 6072141952, vram: 6072141952, nvram: 6641680384 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 6374131840, vram: 6374131840, nvram: 6941573120 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 6681233536, vram: 6681233536, nvram: 7251951616 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 7000000640, vram: 7000000640, nvram: 7570718720 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 7318767744, vram: 7318767744, nvram: 7889485824 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 7637534848, vram: 7637534848, nvram: 8208252928 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 7956301952, vram: 7956301952, nvram: 8527020032 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 8275069056, vram: 8275069056, nvram: 8845787136 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 8593836160, vram: 8593836160, nvram: 9164554240 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 8912603264, vram: 8912603264, nvram: 9483321344 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 9231370368, vram: 9231370368, nvram: 9802088448 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 9550137472, vram: 9550137472, nvram: 10120855552 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 9868904576, vram: 9868904576, nvram: 10439622656 },
{ model: "nemotron-3-nano:4b", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 10187671680, vram: 10187671680, nvram: 10758389760 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 25849973760, vram: 25849973760, nvram: 26323451904 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 25984191488, vram: 25984191488, nvram: 26455572480 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 26118409216, vram: 26118409216, nvram: 26589790208 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 26252626944, vram: 26252626944, nvram: 26724007936 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 26394971136, vram: 26394971136, nvram: 26866614272 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 26545966080, vram: 26545966080, nvram: 27017609216 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 26696961024, vram: 26696961024, nvram: 27168604160 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 26847955968, vram: 26847955968, nvram: 27319599104 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 26998950912, vram: 26998950912, nvram: 27470594048 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 27149945856, vram: 27149945856, nvram: 27621588992 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 27300940800, vram: 27300940800, nvram: 27772583936 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 27451935744, vram: 27451935744, nvram: 27923578880 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 27602930688, vram: 27602930688, nvram: 28074573824 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 27753925632, vram: 27753925632, nvram: 28225568768 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 27904920576, vram: 27904920576, nvram: 28376563712 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 28055915520, vram: 28055915520, nvram: 28527558656 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 278528, ram: 28206910464, vram: 28206910464, nvram: 28678553600 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 294912, ram: 28357905408, vram: 28357905408, nvram: 28829548544 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 311296, ram: 28508900352, vram: 28508900352, nvram: 28980543488 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 327680, ram: 28659895296, vram: 28659895296, nvram: 29131538432 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 344064, ram: 28810890240, vram: 28810890240, nvram: 29282533376 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 360448, ram: 28961885184, vram: 28961885184, nvram: 29433528320 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 376832, ram: 29112880128, vram: 29112880128, nvram: 29584523264 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 393216, ram: 29263875072, vram: 29263875072, nvram: 29735518208 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 409600, ram: 29414870016, vram: 29414870016, nvram: 29886513152 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 425984, ram: 29565864960, vram: 29565864960, nvram: 30037508096 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 442368, ram: 29716859904, vram: 29716859904, nvram: 30188503040 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 458752, ram: 29867854848, vram: 29867854848, nvram: 30339497984 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 475136, ram: 30018849792, vram: 30018849792, nvram: 30490492928 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 491520, ram: 30169844736, vram: 30169844736, nvram: 30641487872 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 507904, ram: 30320839680, vram: 30320839680, nvram: 30792482816 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 524288, ram: 30471834624, vram: 30471834624, nvram: 30943477760 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 540672, ram: 30622829568, vram: 30622829568, nvram: 31094472704 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 557056, ram: 30773824512, vram: 30773824512, nvram: 31245467648 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 573440, ram: 30924819456, vram: 30924819456, nvram: 31396462592 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 589824, ram: 31075814400, vram: 31075814400, nvram: 31549554688 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 606208, ram: 31226809344, vram: 31226809344, nvram: 31698452480 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 622592, ram: 31377804288, vram: 31377804288, nvram: 31849447424 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 638976, ram: 31528799232, vram: 31528799232, nvram: 32000442368 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 655360, ram: 31679794176, vram: 31679794176, nvram: 32151437312 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 671744, ram: 31830789120, vram: 31830789120, nvram: 32302432256 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 688128, ram: 31981784064, vram: 31981784064, nvram: 32453427200 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 704512, ram: 32132779008, vram: 32132779008, nvram: 32604422144 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 720896, ram: 32283773952, vram: 32283773952, nvram: 32755417088 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 737280, ram: 32434768896, vram: 32434768896, nvram: 32906412032 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 753664, ram: 32585763840, vram: 32585763840, nvram: 33057406976 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 770048, ram: 32736758784, vram: 32736758784, nvram: 33210499072 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 786432, ram: 32887753728, vram: 32887753728, nvram: 33359396864 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 802816, ram: 33038748672, vram: 33038748672, nvram: 33510391808 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 819200, ram: 33189743616, vram: 33189743616, nvram: 33661386752 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 835584, ram: 33340738560, vram: 33340738560, nvram: 33812381696 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 851968, ram: 33491733504, vram: 33491733504, nvram: 33963376640 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 868352, ram: 33642728448, vram: 33642728448, nvram: 34114371584 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 884736, ram: 33793723392, vram: 33793723392, nvram: 34265366528 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 901120, ram: 33944718336, vram: 33944718336, nvram: 34416361472 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 917504, ram: 34095713280, vram: 34095713280, nvram: 34567356416 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 933888, ram: 34246708224, vram: 34246708224, nvram: 34718351360 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 950272, ram: 34397703168, vram: 34397703168, nvram: 34869346304 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 966656, ram: 34548698112, vram: 34548698112, nvram: 35020341248 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 983040, ram: 34699693056, vram: 34699693056, nvram: 35171336192 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 999424, ram: 34850688000, vram: 34850688000, nvram: 35473326080 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 1015808, ram: 35001682944, vram: 35001682944, nvram: 35624321024 },
{ model: "nemotron-3-nano:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 1032192, ram: 35152677888, vram: 35152677888, nvram: 35624321024 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 91701882624, vram: 91701882624, nvram: 92121595904 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 91886432000, vram: 91886432000, nvram: 92301950976 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 92070981376, vram: 92070981376, nvram: 92484403200 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 92188421888, vram: 92188421888, nvram: 92601843712 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 92356194048, vram: 92356194048, nvram: 92767518720 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 92523966208, vram: 92523966208, nvram: 92931096576 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 92691738368, vram: 92691738368, nvram: 93096771584 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 92859510528, vram: 92859510528, nvram: 93264543744 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 93027282688, vram: 93027282688, nvram: 93432315904 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 93195054848, vram: 93195054848, nvram: 93600088064 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 93362827008, vram: 93362827008, nvram: 93767860224 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 93530599168, vram: 93530599168, nvram: 93935632384 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 93698371328, vram: 93698371328, nvram: 94103404544 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 93866143488, vram: 93866143488, nvram: 94271176704 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 94043352832, vram: 94043352832, nvram: 94449434624 },
{ model: "nemotron-3-super:120b-a12b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 94227902208, vram: 94227902208, nvram: 94633984000 },
{ model: "olmo-3.1:32b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 21837228544, vram: 21837228544, nvram: 22359834624 },
{ model: "olmo-3.1:32b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 22927747584, vram: 22927747584, nvram: 23450353664 },
{ model: "olmo-3.1:32b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 24035043840, vram: 24035043840, nvram: 24553455616 },
{ model: "olmo-3.1:32b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 25142340096, vram: 25142340096, nvram: 25660751872 },
{ model: "qwen2.5-coder:7b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 6297843712, vram: 6297843712, nvram: 6469713920 },
{ model: "qwen2.5-coder:7b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 8210446336, vram: 8210446336, nvram: 7442792448 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 20356380800, vram: 20356380800, nvram: 20898119680 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 22038296704, vram: 22038296704, nvram: 22580035584 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 23665686656, vram: 23665686656, nvram: 24205328384 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 25326631040, vram: 25326631040, nvram: 25866272768 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 26987575424, vram: 26987575424, nvram: 27527217152 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 28648519808, vram: 28648519808, nvram: 29188161536 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 30309464192, vram: 30309464192, nvram: 30849105920 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 31970408576, vram: 31970408576, nvram: 32510050304 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 33631352960, vram: 33631352960, nvram: 34170994688 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 35292297344, vram: 35292297344, nvram: 35831939072 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 36953241728, vram: 36953241728, nvram: 37492883456 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 38614186112, vram: 38614186112, nvram: 39153827840 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 40275130496, vram: 40275130496, nvram: 40814772224 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 41936074880, vram: 41936074880, nvram: 42475716608 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 43597019264, vram: 43597019264, nvram: 44136660992 },
{ model: "qwen3-coder:30b-a3b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 45257963648, vram: 45257963648, nvram: 45797605376 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 9237766784, vram: 9237766784, nvram: 9330229248 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 9939657344, vram: 9939657344, nvram: 10030678016 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 10675790464, vram: 10675790464, nvram: 10766778368 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 11411923584, vram: 11411923584, nvram: 11502878720 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 12148056704, vram: 12148056704, nvram: 12238979072 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 12884189824, vram: 12884189824, nvram: 12975079424 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 13620322944, vram: 13620322944, nvram: 13711179776 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 14356456064, vram: 14356456064, nvram: 14447280128 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 15092589184, vram: 15092589184, nvram: 15183380480 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 15828722304, vram: 15828722304, nvram: 15919480832 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 16564855424, vram: 16564855424, nvram: 16657678336 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 17300988544, vram: 17300988544, nvram: 17393778688 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 18037121664, vram: 18037121664, nvram: 18129879040 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 18773254784, vram: 18773254784, nvram: 18865979392 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 19509387904, vram: 19509387904, nvram: 19602079744 },
{ model: "qwen3.5:9b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 20245521024, vram: 20245521024, nvram: 20338180096 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 9362191872, vram: 9362191872, nvram: 9661579264 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 11877692928, vram: 11877692928, nvram: 12178161664 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 14393193984, vram: 14393193984, nvram: 14692646912 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 17008276992, vram: 17008276992, nvram: 17307795456 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 19623360000, vram: 19623360000, nvram: 19922944000 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 22238443008, vram: 22238443008, nvram: 22538092544 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 24853526016, vram: 24853526016, nvram: 25153241088 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 27468609024, vram: 27468609024, nvram: 27768389632 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 30083692032, vram: 30083692032, nvram: 30383538176 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 32698775040, vram: 32698775040, nvram: 32998686720 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 35313858048, vram: 35313858048, nvram: 35613835264 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 37928941056, vram: 37928941056, nvram: 38228983808 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 212992, ram: 40544024064, vram: 40544024064, nvram: 40844132352 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 229376, ram: 43159107072, vram: 43159107072, nvram: 43459280896 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 245760, ram: 45774190080, vram: 45774190080, nvram: 46074429440 },
{ model: "qwen3-vl:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 262144, ram: 48389273088, vram: 48389273088, nvram: 48689577984 },
{ model: "rnj-1:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 7988582528, vram: 7988582528, nvram: 8269070336 },
{ model: "rnj-1:8b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 10178009216, vram: 10178009216, nvram: 10460594176 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 259697554688, vram: 259697554688, nvram: 153998065664 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 328349922560, vram: 328349922560, nvram: 179006603264 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 384520041728, vram: 384520041728, nvram: 184132042752 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 440690160896, vram: 398052411264, nvram: 150223192064 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 496860280064, vram: 397053472512, nvram: 111430074368 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 553030399232, vram: 395859299584, nvram: 76359401472 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 609200518400, vram: 394996973952, nvram: 36081500160 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 665370637568, vram: 399431958528, nvram: 5230297088 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 721540756736, vram: 449360953344, nvram: 5347737600 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 777710875904, vram: 499289948160, nvram: 5465178112 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 833880995072, vram: 549218942976, nvram: 5582618624 },
// { model: "frob/glm-4.7:358b-a32b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 890051114240, vram: 599147937792, nvram: 5700059136 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 30593792000, vram: 30593792000, nvram: 30198988800 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 37338232832, vram: 37338232832, nvram: 35592863744 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 44082673664, vram: 44082673664, nvram: 41011904512 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 50827114496, vram: 50827114496, nvram: 46374322176 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 57571555328, vram: 57571555328, nvram: 51793362944 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 64315996160, vram: 64315996160, nvram: 57155780608 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 71060436992, vram: 71060436992, nvram: 62574821376 },
{ model: "frob/iquest-coder:40b-instruct-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 77804877824, vram: 77804877824, nvram: 67993862144 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 16384, ram: 150470634496, vram: 150470634496, nvram: 144479092736 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 32768, ram: 162952883200, vram: 162952883200, nvram: 74966892544 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 49152, ram: 175435131904, vram: 175435131904, nvram: 153255673856 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 65536, ram: 187917380608, vram: 187917380608, nvram: 79362523136 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 81920, ram: 221203377152, vram: 221203377152, nvram: 110169686016 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 98304, ram: 237846375424, vram: 237846375424, nvram: 113122476032 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 114688, ram: 254489373696, vram: 254489373696, nvram: 116075266048 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 131072, ram: 271132371968, vram: 271132371968, nvram: 119028056064 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 147456, ram: 287775370240, vram: 287775370240, nvram: 121980846080 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 163840, ram: 346025864192, vram: 346025864192, nvram: 140469338112 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 180224, ram: 366829612032, vram: 366829612032, nvram: 143774449664 },
// { model: "frob/minimax-m2.5:230b-a10b-q4_K_M", version: "0.18.0", quant: "Q4_K_M", context: 196608, ram: 387633359872, vram: 383945237504, nvram: 141048152064 },
];
// Line/point colours for the chart. Datasets pick an entry by index and wrap
// around (index % palette.length) when there are more datasets than colours.
const palette = [
  "#3266ad", "#c85250", "#4e9a51", "#9b6db5", "#d17a2f", "#5baab0",
  "#b55e8c", "#7b7b2a", "#4a7abf", "#e06060", "#45a087", "#d4aa44",
  "#888888", "#c07840", "#6644aa", "#2e8b8b", "#a04060", "#3a9ad4",
];
// Get unique versions, ordered by numeric value of each dotted component.
// The default Array.prototype.sort() compares strings by code unit, which
// would put "0.18.0" before "0.9.0"; a numeric-aware comparison keeps the
// version buttons in release order.
const versions = [...new Set(raw.map(r => r.version))]
  .sort((a, b) => String(a).localeCompare(String(b), 'en', { numeric: true }));
// Get unique models (first-seen order in `raw`)
const models = [...new Set(raw.map(r => r.model))];
// Current filter state: 'all' or one of the entries in `versions`
let selectedVersion = 'all';
// Create datasets with version info.
// One Chart.js dataset is built per distinct (model, version) pair found in
// `raw`. Grouping on the pair (rather than on the model name alone) keeps
// measurements of the same model taken under different versions on separate
// lines, so a line never carries two y values for one context size and each
// dataset's `version` matches every point it contains. When every model has a
// single version the result is the same as grouping by model.
const datasets = (() => {
  // Map preserves insertion order, so datasets (and therefore palette
  // colours and legend buttons) follow first appearance in `raw`.
  const groups = new Map();
  for (const row of raw) {
    const version = row.version || 'unknown';
    const key = JSON.stringify([row.model, version]);
    let group = groups.get(key);
    if (!group) {
      group = { model: row.model, version, rows: [] };
      groups.set(key, group);
    }
    group.rows.push(row);
  }

  return Array.from(groups.values(), (group, i) => {
    const color = palette[i % palette.length];
    // Points are ordered by context size so the line is drawn left to right.
    const pts = group.rows.sort((a, b) => a.context - b.context);
    return {
      label: group.model,
      version: group.version,
      // x: context in K tokens (context / 1024); y: `ram` in GB (bytes / 1e9),
      // rounded to two decimals.
      data: pts.map(p => ({ x: p.context / 1024, y: +(p.ram / 1e9).toFixed(2) })),
      borderColor: color,
      backgroundColor: color,
      borderWidth: 2,
      pointRadius: 3,
      pointHoverRadius: 5,
      tension: 0.3,
      fill: false,
    };
  });
})();
// Distinct context sizes present in `raw`, expressed in K tokens and sorted
// ascending. The x-max slider steps through these values.
const allContextsK = Array.from(new Set(raw.map(row => row.context / 1024)));
allContextsK.sort((lhs, rhs) => lhs - rhs);
const maxSteps = allContextsK.length;
const slider = document.getElementById('xmax-slider');
const xmaxLabel = document.getElementById('xmax-label');
// Slider positions run from 1 to the number of distinct context sizes and
// start at the last one (the largest context).
Object.assign(slider, { min: 1, max: maxSteps, value: maxSteps });
/**
 * Format a size given in K units as a short label.
 *
 * Values of 1024 and above are shown in M with at most one decimal (a
 * trailing ".0" is dropped); everything else is rounded to a whole number of K.
 *
 * @param {number} k Size in K units.
 * @returns {string} For example "16K", "1M" or "1.5M".
 */
function formatK(k) {
  if (k >= 1024) {
    const mega = (k / 1024).toFixed(1);
    return mega.replace(/\.0$/, '') + 'M';
  }
  return Math.round(k) + 'K';
}
/**
 * Look up the context size (in K tokens) selected by the x-max slider.
 *
 * The slider value is a 1-based position into `allContextsK`.
 *
 * @returns {number} The entry of `allContextsK` at the slider position.
 */
function getXMax() {
  const position = parseInt(slider.value);
  return allContextsK[position - 1];
}
// Show the initial x-axis limit next to the slider.
xmaxLabel.textContent = formatK(getXMax());
// Create version selector buttons: one per entry in `versions`, appended to
// the #version-ctrl container.
const versionCtrlEl = document.getElementById('version-ctrl');
for (const ver of versions) {
  const verBtn = document.createElement('button');
  verBtn.className = 'ctrl-btn';
  verBtn.dataset.version = ver;
  verBtn.textContent = ver;
  verBtn.addEventListener('click', () => selectVersion(ver));
  versionCtrlEl.appendChild(verBtn);
}
// Add event listener for the "All" button (looked up by data-version="all"
// inside #version-ctrl).
document
  .querySelector('#version-ctrl .ctrl-btn[data-version="all"]')
  .addEventListener('click', () => selectVersion('all'));
/**
 * Apply a version filter to the chart and its controls.
 *
 * Records the choice in `selectedVersion`, marks the matching version button
 * as active, hides every dataset whose version does not match, shows only the
 * matching legend buttons, and redraws the chart.
 *
 * @param {string} version A version string, or 'all' to show every dataset.
 */
function selectVersion(version) {
  selectedVersion = version;
  const matchesFilter = ds => version === 'all' || ds.version === version;

  // Update button states
  for (const ctrlBtn of document.querySelectorAll('#version-ctrl .ctrl-btn')) {
    ctrlBtn.classList.toggle('active', ctrlBtn.dataset.version === version);
  }

  // Filter datasets
  for (const ds of datasets) {
    ds.hidden = !matchesFilter(ds);
  }

  // Update legend visibility; legend buttons are matched to datasets by index.
  document.querySelectorAll('.leg-btn').forEach((legBtn, idx) => {
    const ds = datasets[idx];
    legBtn.style.display = matchesFilter(ds) ? 'inline-flex' : 'none';
    legBtn.style.opacity = ds.hidden ? '0.3' : '1';
  });

  chart.update();
}
// Line chart drawn on the #myChart canvas from `datasets`. The built-in
// legend and title are disabled, and the x axis starts at 0 and ends at the
// slider's current context size.
// NOTE(review): the y axis is titled "VRAM (GB)" while the dataset y values
// are computed from each row's `ram` field — confirm which one is intended.
const chart = (() => {
  const axisTextColor = '#666';
  const makeAxisTitle = text => ({ display: true, text, color: axisTextColor, font: { size: 12 } });
  const makeGrid = () => ({ color: 'rgba(255,255,255,0.06)' });
  const makeBorder = () => ({ color: '#333' });

  const tooltip = {
    mode: 'nearest',
    intersect: false,
    backgroundColor: '#1e1e1e',
    borderColor: '#444',
    borderWidth: 1,
    titleColor: '#aaa',
    bodyColor: '#ddd',
    callbacks: {
      // Heading: the hovered point's context size.
      title(items) {
        return 'Context: ' + formatK(items[0].parsed.x) + ' tokens';
      },
      // Body line: dataset label and y value with one decimal.
      label(item) {
        return ' ' + item.dataset.label + ': ' + item.parsed.y.toFixed(1) + ' GB';
      }
    }
  };

  const xAxis = {
    type: 'linear',
    min: 0,
    max: getXMax(),
    title: makeAxisTitle('Context (K tokens)'),
    ticks: {
      color: axisTextColor,
      callback(value) {
        return formatK(value);
      }
    },
    grid: makeGrid(),
    border: makeBorder()
  };

  const yAxis = {
    title: makeAxisTitle('VRAM (GB)'),
    ticks: {
      color: axisTextColor,
      callback(value) {
        return value + ' GB';
      }
    },
    grid: makeGrid(),
    border: makeBorder()
  };

  return new Chart(document.getElementById('myChart'), {
    type: 'line',
    data: { datasets },
    options: {
      responsive: true,
      maintainAspectRatio: false,
      interaction: { mode: 'nearest', intersect: false, axis: 'xy' },
      plugins: {
        legend: { display: false },
        title: { display: false },
        tooltip
      },
      scales: { x: xAxis, y: yAxis }
    }
  });
})();
// When the slider moves, use the newly selected context size as the x-axis
// maximum, refresh the label beside the slider, and redraw.
slider.addEventListener('input', () => {
  const limitK = getXMax();
  chart.options.scales.x.max = limitK;
  xmaxLabel.textContent = formatK(limitK);
  chart.update();
});
const legendEl = document.getElementById('legend');
// "All" control: show every dataset that passes the current version filter
// (and hide the rest), redraw, then set each legend button's opacity to match.
document.getElementById('btn-all').addEventListener('click', () => {
  const inFilter = ds => selectedVersion === 'all' || ds.version === selectedVersion;

  for (const ds of datasets) {
    ds.hidden = !inFilter(ds);
  }
  chart.update();

  // Legend buttons are matched to datasets by index.
  document.querySelectorAll('.leg-btn').forEach((legBtn, idx) => {
    legBtn.style.opacity = inFilter(datasets[idx]) ? '1' : '0.3';
  });
});
// "None" control: hide every dataset, redraw, and dim every legend button.
document.getElementById('btn-none').addEventListener('click', () => {
  for (const ds of datasets) {
    ds.hidden = true;
  }
  chart.update();
  for (const legBtn of document.querySelectorAll('.leg-btn')) {
    legBtn.style.opacity = '0.3';
  }
});
// Build one legend toggle button per dataset and append it to the legend
// container. Each button holds a colour swatch, the dataset label and a
// version tag; clicking it flips the dataset's `hidden` flag, dims or
// restores the button, and redraws the chart.
//
// The content is assembled from DOM nodes and text rather than an HTML
// string, so a label or version containing "<" or "&" is shown literally
// instead of being parsed as markup.
datasets.forEach(ds => {
  const btn = document.createElement('button');
  // Explicit type: a bare <button> defaults to "submit".
  btn.type = 'button';
  btn.className = 'leg-btn';
  btn.style.border = '0.5px solid ' + ds.borderColor;

  const swatch = document.createElement('span');
  swatch.className = 'swatch';
  swatch.style.background = ds.borderColor;

  const versionTag = document.createElement('span');
  versionTag.className = 'version-tag';
  versionTag.textContent = ds.version;

  // A string argument to append() is inserted as a text node.
  btn.append(swatch, ds.label, versionTag);

  btn.addEventListener('click', () => {
    ds.hidden = !ds.hidden;
    btn.style.opacity = ds.hidden ? '0.3' : '1';
    chart.update();
  });
  legendEl.appendChild(btn);
});
</script>
</body>
</html>