|
965 | 965 | - config-keys: |
966 | 966 | # NVIDIA single-node |
967 | 967 | - dsr1-fp4-b200-sglang |
968 | | - - dsr1-fp4-b200-trt |
969 | | - - dsr1-fp4-b200-trt-mtp |
970 | | - - dsr1-fp8-b200-sglang |
971 | | - - dsr1-fp8-b200-sglang-mtp |
972 | | - - dsr1-fp8-b200-trt |
973 | | - - dsr1-fp8-b200-trt-mtp |
974 | | - - dsr1-fp8-h200-sglang |
975 | | - - dsr1-fp8-h200-trt |
976 | | - - dsr1-fp8-h200-trt-mtp |
977 | | - - gptoss-fp4-b200-trt |
978 | | - - gptoss-fp4-b200-vllm |
979 | | - - gptoss-fp4-h100-vllm |
980 | | - - gptoss-fp4-h200-trt |
981 | | - - gptoss-fp4-h200-vllm |
982 | | - - kimik2.5-fp4-b200-vllm |
983 | | - - kimik2.5-int4-b200-vllm |
984 | | - - kimik2.5-int4-h200-vllm |
985 | | - - minimaxm2.5-fp8-b200-vllm |
986 | | - - minimaxm2.5-fp8-h100-vllm |
987 | | - - minimaxm2.5-fp8-h200-vllm |
988 | | - - qwen3.5-bf16-b200-sglang |
989 | | - - qwen3.5-fp8-b200-sglang |
990 | | - - qwen3.5-fp8-h200-sglang |
991 | 968 | # AMD single-node |
992 | | - - dsr1-fp4-mi355x-atom |
993 | 969 | - dsr1-fp4-mi355x-atom-mtp |
994 | | - - dsr1-fp4-mi355x-sglang |
995 | | - - dsr1-fp8-mi300x-sglang |
996 | | - - dsr1-fp8-mi325x-sglang |
997 | | - - dsr1-fp8-mi355x-atom |
998 | | - - dsr1-fp8-mi355x-atom-mtp |
999 | | - - dsr1-fp8-mi355x-sglang |
1000 | | - - glm5-fp8-mi355x-sglang |
1001 | | - - gptoss-fp4-mi300x-vllm |
1002 | | - - gptoss-fp4-mi325x-vllm |
1003 | | - - gptoss-fp4-mi355x-atom |
1004 | | - - gptoss-fp4-mi355x-vllm |
1005 | | - - kimik2.5-fp4-mi355x-vllm |
1006 | | - - kimik2.5-int4-mi325x-vllm |
1007 | | - - kimik2.5-int4-mi355x-vllm |
1008 | | - - minimaxm2.5-fp8-mi300x-vllm |
1009 | | - - minimaxm2.5-fp8-mi325x-vllm |
1010 | | - - minimaxm2.5-fp8-mi355x-vllm |
1011 | | - - qwen3.5-bf16-mi300x-sglang |
1012 | | - - qwen3.5-bf16-mi325x-sglang |
1013 | | - - qwen3.5-bf16-mi355x-sglang |
1014 | | - - qwen3.5-fp8-mi300x-sglang |
1015 | | - - qwen3.5-fp8-mi325x-sglang |
1016 | | - - qwen3.5-fp8-mi355x-sglang |
1017 | 970 | description: |
1018 | 971 | - "Separate evals, change to 8k1k" |
1019 | 972 | pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/911 |
1020 | | - evals-only: true |
0 commit comments