# Quantized Matmul Attention and KV Cache
# kernel support matrix
steps:
  # Placeholder correctness step: no test is executed yet. Its only command
  # stores the value "to be added" under the Buildkite meta-data key
  # "Quantized Matmul Attention and KV Cache:CorrectnessTest".
  # soft_fail keeps a failure here from failing the whole build.
  - label: "Correctness tests for Quantized Matmul Attention and KV Cache"
    key: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
    soft_fail: true
    agents:
      queue: cpu
    commands:
      - |
        buildkite-agent meta-data set "Quantized Matmul Attention and KV Cache:CorrectnessTest" "to be added"

  # Runs once the correctness step above has finished and passes that step's
  # key to record_step_result.sh, with CI_TARGET / CI_STAGE / CI_CATEGORY
  # exported in the step environment.
  # NOTE(review): the script is not visible here; presumably it reads these
  # variables to file the result under the right target/stage - confirm.
  - label: "Record correctness test result for Quantized Matmul Attention and KV Cache"
    key: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
    depends_on: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
    env:
      CI_TARGET: "Quantized Matmul Attention and KV Cache"
      CI_STAGE: "CorrectnessTest"
      CI_CATEGORY: "kernel support matrix"
    agents:
      queue: cpu
    commands:
      - |
        .buildkite/scripts/record_step_result.sh Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest

24 | 25 | - label: "Performance tests for Quantized Matmul Attention and KV Cache" |
25 | 26 | key: "Quantized_Matmul_Attention_and_KV_Cache_PerformanceTest" |
26 | | - # depends_on: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest" |
| 27 | + depends_on: "record_Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest" |
27 | 28 | soft_fail: true |
28 | 29 | agents: |
29 | 30 | queue: tpu_v6e_8_queue |
|
0 commit comments