Separate model and feature support matrices by category (#1100)

boe20211 · boe20211 · commit 5ccc67166cf3 · 2025-11-17T10:16:31.000+08:00
Signed-off-by: Teresa Chen <boe20211@gmail.com>
diff --git a/.buildkite/features/JAX-Path_Qxix_Quantization.yml b/.buildkite/features/JAX-Path_Qxix_Quantization.yml
@@ -1,29 +1,30 @@
 # JAX-Path Qxix Quantization
 # feature support matrix
 steps:
-  # - label: "Correctness tests for JAX-Path Qxix Quantization"
-  #   key: "JAX-Path_Qxix_Quantization_CorrectnessTest"
-  #   soft_fail: true
-  #   agents:
-  #     queue: tpu_v6e_queue
-  #   commands:
-  #     - echo "covered by performance tests"
-  # - label: "Record correctness test result for JAX-Path Qxix Quantization"
-  #   key: "record_JAX-Path_Qxix_Quantization_CorrectnessTest"
-  #   depends_on: "JAX-Path_Qxix_Quantization_CorrectnessTest"
-  #   env:
-  #     CI_TARGET: "JAX-Path Qxix Quantization"
-  #     CI_STAGE: "CorrectnessTest"
-  #     CI_CATEGORY: "feature support matrix"
-  #   agents:
-  #     queue: cpu
-  #   commands:
-  #     - |
-  #       .buildkite/scripts/record_step_result.sh JAX-Path_Qxix_Quantization_CorrectnessTest
+  - label: "Correctness tests for JAX-Path Qxix Quantization"
+    key: "JAX-Path_Qxix_Quantization_CorrectnessTest"
+    soft_fail: true
+    agents:
+      queue: tpu_v6e_queue
+    commands:
+      - |
+        buildkite-agent meta-data set "JAX-Path Qxix Quantization:CorrectnessTest" "to be added"
+  - label: "Record correctness test result for JAX-Path Qxix Quantization"
+    key: "record_JAX-Path_Qxix_Quantization_CorrectnessTest"
+    depends_on: "JAX-Path_Qxix_Quantization_CorrectnessTest"
+    env:
+      CI_TARGET: "JAX-Path Qxix Quantization"
+      CI_STAGE: "CorrectnessTest"
+      CI_CATEGORY: "feature support matrix"
+    agents:
+      queue: cpu
+    commands:
+      - |
+        .buildkite/scripts/record_step_result.sh JAX-Path_Qxix_Quantization_CorrectnessTest
 
   - label: "Performance tests for JAX-Path Qxix Quantization"
     key: "JAX-Path_Qxix_Quantization_PerformanceTest"
-    # depends_on: "record_JAX-Path_Qxix_Quantization_CorrectnessTest"
+    depends_on: "record_JAX-Path_Qxix_Quantization_CorrectnessTest"
     soft_fail: true
     env:
       QUANTIZATION: "True"
diff --git a/.buildkite/features/Quantized_Matmul_Attention_and_KV_Cache.yml b/.buildkite/features/Quantized_Matmul_Attention_and_KV_Cache.yml
@@ -1,29 +1,30 @@
 # Quantized Matmul Attention and KV Cache
 # kernel support matrix
 steps:
-  # - label: "Correctness tests for Quantized Matmul Attention and KV Cache"
-  #   key: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
-  #   soft_fail: true
-  #   agents:
-  #     queue: cpu
-  #   commands:
-  #     - echo "covered by performance test"
-  # - label: "Record correctness test result for Quantized Matmul Attention and KV Cache"
-  #   key: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
-  #   depends_on: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
-  #   env:
-  #     CI_TARGET: "Quantized Matmul Attention and KV Cache"
-  #     CI_STAGE: "CorrectnessTest"
-  #     CI_CATEGORY: "kernel support matrix"
-  #   agents:
-  #     queue: cpu
-  #   commands:
-  #     - |
-  #       .buildkite/scripts/record_step_result.sh Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest
+  - label: "Correctness tests for Quantized Matmul Attention and KV Cache"
+    key: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
+    soft_fail: true
+    agents:
+      queue: cpu
+    commands:
+      - |
+        buildkite-agent meta-data set "Quantized Matmul Attention and KV Cache:CorrectnessTest" "to be added"
+  - label: "Record correctness test result for Quantized Matmul Attention and KV Cache"
+    key: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
+    depends_on: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
+    env:
+      CI_TARGET: "Quantized Matmul Attention and KV Cache"
+      CI_STAGE: "CorrectnessTest"
+      CI_CATEGORY: "kernel support matrix"
+    agents:
+      queue: cpu
+    commands:
+      - |
+        .buildkite/scripts/record_step_result.sh Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest
 
   - label: "Performance tests for Quantized Matmul Attention and KV Cache"
     key: "Quantized_Matmul_Attention_and_KV_Cache_PerformanceTest"
-    # depends_on: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
+    depends_on: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
     soft_fail: true
     agents:
       queue: tpu_v6e_8_queue
diff --git a/.buildkite/parallelism/CP.yml b/.buildkite/parallelism/CP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "CP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for CP"
     key: "record_CP_CorrectnessTest"
     depends_on: "CP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "CP:PerformanceTest" "to be added"
   - label: "Record performance test result for CP"
     key: "record_CP_PerformanceTest"
     depends_on: "CP_PerformanceTest"
diff --git a/.buildkite/parallelism/DP.yml b/.buildkite/parallelism/DP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "DP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for DP"
     key: "record_DP_CorrectnessTest"
     depends_on: "DP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "DP:PerformanceTest" "to be added"
   - label: "Record performance test result for DP"
     key: "record_DP_PerformanceTest"
     depends_on: "DP_PerformanceTest"
diff --git a/.buildkite/parallelism/EP.yml b/.buildkite/parallelism/EP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "EP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for EP"
     key: "record_EP_CorrectnessTest"
     depends_on: "EP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "EP:PerformanceTest" "to be added"
   - label: "Record performance test result for EP"
     key: "record_EP_PerformanceTest"
     depends_on: "EP_PerformanceTest"
diff --git a/.buildkite/parallelism/PP.yml b/.buildkite/parallelism/PP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "PP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for PP"
     key: "record_PP_CorrectnessTest"
     depends_on: "PP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "PP:PerformanceTest" "to be added"
   - label: "Record performance test result for PP"
     key: "record_PP_PerformanceTest"
     depends_on: "PP_PerformanceTest"
diff --git a/.buildkite/parallelism/SP.yml b/.buildkite/parallelism/SP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "SP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for SP"
     key: "record_SP_CorrectnessTest"
     depends_on: "SP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "SP:PerformanceTest" "to be added"
   - label: "Record performance test result for SP"
     key: "record_SP_PerformanceTest"
     depends_on: "SP_PerformanceTest"
diff --git a/.buildkite/parallelism/TP.yml b/.buildkite/parallelism/TP.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "TP:CorrectnessTest" "to be added"
   - label: "Record correctness test result for TP"
     key: "record_TP_CorrectnessTest"
     depends_on: "TP_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "TP:PerformanceTest" "to be added"
   - label: "Record performance test result for TP"
     key: "record_TP_PerformanceTest"
     depends_on: "TP_PerformanceTest"
diff --git a/.buildkite/quantization/AWQ_INT4.yml b/.buildkite/quantization/AWQ_INT4.yml
@@ -6,8 +6,9 @@ steps:
     soft_fail: true
     agents:
       queue: tpu_v6e_queue
-    commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+    commands: 
+      - |
+        buildkite-agent meta-data set "AWQ INT4:CorrectnessTest" "to be added"
   - label: "Record correctness test result for AWQ INT4"
     key: "record_AWQ_INT4_CorrectnessTest"
     depends_on: "AWQ_INT4_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "AWQ INT4:PerformanceTest" "to be added"
   - label: "Record performance test result for AWQ INT4"
     key: "record_AWQ_INT4_PerformanceTest"
     depends_on: "AWQ_INT4_PerformanceTest"
diff --git a/.buildkite/quantization/FP4_W4A16.yml b/.buildkite/quantization/FP4_W4A16.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "FP4 W4A16:CorrectnessTest" "to be added"
   - label: "Record correctness test result for FP4 W4A16"
     key: "record_FP4_W4A16_CorrectnessTest"
     depends_on: "FP4_W4A16_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "FP4 W4A16:PerformanceTest" "to be added"
   - label: "Record performance test result for FP4 W4A16"
     key: "record_FP4_W4A16_PerformanceTest"
     depends_on: "FP4_W4A16_PerformanceTest"
diff --git a/.buildkite/quantization/FP8_W8A16.yml b/.buildkite/quantization/FP8_W8A16.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "FP8 W8A16:CorrectnessTest" "to be added"
   - label: "Record correctness test result for FP8 W8A16"
     key: "record_FP8_W8A16_CorrectnessTest"
     depends_on: "FP8_W8A16_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "FP8 W8A16:PerformanceTest" "to be added"
   - label: "Record performance test result for FP8 W8A16"
     key: "record_FP8_W8A16_PerformanceTest"
     depends_on: "FP8_W8A16_PerformanceTest"
diff --git a/.buildkite/quantization/FP8_W8A8.yml b/.buildkite/quantization/FP8_W8A8.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "FP8 W8A8:CorrectnessTest" "to be added"
   - label: "Record correctness test result for FP8 W8A8"
     key: "record_FP8_W8A8_CorrectnessTest"
     depends_on: "FP8_W8A8_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "FP8 W8A8:PerformanceTest" "to be added"
   - label: "Record performance test result for FP8 W8A8"
     key: "record_FP8_W8A8_PerformanceTest"
     depends_on: "FP8_W8A8_PerformanceTest"
diff --git a/.buildkite/quantization/INT4_W4A16.yml b/.buildkite/quantization/INT4_W4A16.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "INT4 W4A16:CorrectnessTest" "to be added"
   - label: "Record correctness test result for INT4 W4A16"
     key: "record_INT4_W4A16_CorrectnessTest"
     depends_on: "INT4_W4A16_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "INT4 W4A16:PerformanceTest" "to be added"
   - label: "Record performance test result for INT4 W4A16"
     key: "record_INT4_W4A16_PerformanceTest"
     depends_on: "INT4_W4A16_PerformanceTest"
diff --git a/.buildkite/quantization/INT8_W8A8.yml b/.buildkite/quantization/INT8_W8A8.yml
@@ -7,7 +7,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your correctness test command
+      - |
+        buildkite-agent meta-data set "INT8 W8A8:CorrectnessTest" "to be added"
   - label: "Record correctness test result for INT8 W8A8"
     key: "record_INT8_W8A8_CorrectnessTest"
     depends_on: "INT8_W8A8_CorrectnessTest"
@@ -28,7 +29,8 @@ steps:
     agents:
       queue: tpu_v6e_queue
     commands:
-      - echo "placeholder"  # TODO : replace with your performance test command
+      - |
+        buildkite-agent meta-data set "INT8 W8A8:PerformanceTest" "to be added"
   - label: "Record performance test result for INT8 W8A8"
     key: "record_INT8_W8A8_PerformanceTest"
     depends_on: "INT8_W8A8_PerformanceTest"
diff --git a/.buildkite/scripts/upload_models_and_features.sh b/.buildkite/scripts/upload_models_and_features.sh
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 BUILDKITE_DIR=".buildkite"
-TARGET_FOLDERS="models features parallelism quatization"
+TARGET_FOLDERS="models features parallelism quantization"
 MODEL_LIST_KEY="model-list"
 FEATURE_LIST_KEY="feature-list"
 
@@ -43,7 +43,7 @@ for folder_path in $TARGET_FOLDERS; do
         "parallelism")
           feature_list+=("${subject_name}")
           ;;
-        "quatization")
+        "quantization")
           feature_list+=("${subject_name}")
           ;;
       esac