We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0837dc0 commit ee0085bCopy full SHA for ee0085b
.github/scripts/generate_vllm_benchmark_matrix.py
@@ -71,6 +71,7 @@
71
],
72
"meta-llama/Meta-Llama-3.1-70B-Instruct": [
73
"linux.dgx.b200",
74
+ "linux.rocm.gpu.gfx942", # TODO: Fail on ROCm
75
76
"mistralai/Mixtral-8x7B-Instruct-v0.1": [
77
@@ -86,6 +87,7 @@
86
87
"Qwen/Qwen3-30B-A3B": [
88
"linux.aws.a100",
89
"linux.aws.h100",
90
91
92
"google/gemma-3-27b-it": [
93
@@ -95,6 +97,7 @@
95
97
"meta-llama/Llama-4-Scout-17B-16E-Instruct": [
96
98
99
100
101
102
"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": [
103
0 commit comments