Skip some models on ROCm (#85)

huydhn · web-flow · commit ee0085be0bfe · 2025-10-01T17:06:11.000-07:00
Signed-off-by: Huy Do <huydhn@gmail.com>
diff --git a/.github/scripts/generate_vllm_benchmark_matrix.py b/.github/scripts/generate_vllm_benchmark_matrix.py
@@ -71,6 +71,7 @@
     ],
     "meta-llama/Meta-Llama-3.1-70B-Instruct": [
         "linux.dgx.b200",
+        "linux.rocm.gpu.gfx942",  # TODO: Fails on ROCm; skipped for now
     ],
     "mistralai/Mixtral-8x7B-Instruct-v0.1": [
         "linux.dgx.b200",
@@ -86,6 +87,7 @@
     "Qwen/Qwen3-30B-A3B": [
         "linux.aws.a100",
         "linux.aws.h100",
+        "linux.rocm.gpu.gfx942",  # TODO: Fails on ROCm; skipped for now
     ],
     "google/gemma-3-27b-it": [
         "linux.aws.a100",
@@ -95,6 +97,7 @@
     "meta-llama/Llama-4-Scout-17B-16E-Instruct": [
         "linux.aws.a100",
         "linux.aws.h100",
+        "linux.rocm.gpu.gfx942",  # TODO: Fails on ROCm; skipped for now
     ],
     "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": [
         "linux.aws.a100",