vllm-project
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w16a16.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w16a16.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a16.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a16.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a4.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a4.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a8.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w4a8.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w8a16.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w8a16.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w8a8.yml‎
Lines changed: 45 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/all_gather_matmul/w8a8.yml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/for_attention_kernels_KV_cache/w16a16.yml‎
Lines changed: 46 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/for_attention_kernels_KV_cache/w16a16.yml‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎.buildkite/kernel_microbenchmarks/for_attention_kernels_KV_cache/w4a16.yml‎
Lines changed: 46 additions & 0 deletions b/‎.buildkite/kernel_microbenchmarks/for_attention_kernels_KV_cache/w4a16.yml‎
Lines changed: 46 additions & 0 deletions
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w16a16
+steps:
+  - key: 'all-gather-matmul-w16a16_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w16a16'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w16a16_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w16a16_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w16a16'
+    depends_on: 'all-gather-matmul-w16a16_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w16a16'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w16a16_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w16a16_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w16a16'
+    depends_on: 'record_all-gather-matmul-w16a16_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w16a16_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w16a16_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w16a16'
+    depends_on: 'all-gather-matmul-w16a16_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w16a16'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w16a16_PerformanceTest
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w4a16
+steps:
+  - key: 'all-gather-matmul-w4a16_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w4a16'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a16_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a16_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w4a16'
+    depends_on: 'all-gather-matmul-w4a16_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w4a16'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a16_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w4a16_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w4a16'
+    depends_on: 'record_all-gather-matmul-w4a16_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a16_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a16_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w4a16'
+    depends_on: 'all-gather-matmul-w4a16_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w4a16'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a16_PerformanceTest
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w4a4
+steps:
+  - key: 'all-gather-matmul-w4a4_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w4a4'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a4_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a4_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w4a4'
+    depends_on: 'all-gather-matmul-w4a4_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w4a4'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a4_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w4a4_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w4a4'
+    depends_on: 'record_all-gather-matmul-w4a4_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a4_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a4_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w4a4'
+    depends_on: 'all-gather-matmul-w4a4_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w4a4'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a4_PerformanceTest
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w4a8
+steps:
+  - key: 'all-gather-matmul-w4a8_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w4a8'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a8_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a8_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w4a8'
+    depends_on: 'all-gather-matmul-w4a8_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w4a8'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a8_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w4a8_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w4a8'
+    depends_on: 'record_all-gather-matmul-w4a8_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w4a8_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w4a8_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w4a8'
+    depends_on: 'all-gather-matmul-w4a8_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w4a8'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w4a8_PerformanceTest
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w8a16
+steps:
+  - key: 'all-gather-matmul-w8a16_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w8a16'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w8a16_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w8a16_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w8a16'
+    depends_on: 'all-gather-matmul-w8a16_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w8a16'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w8a16_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w8a16_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w8a16'
+    depends_on: 'record_all-gather-matmul-w8a16_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w8a16_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w8a16_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w8a16'
+    depends_on: 'all-gather-matmul-w8a16_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w8a16'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w8a16_PerformanceTest
@@ -0,0 +1,45 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: all-gather-matmul-w8a8
+steps:
+  - key: 'all-gather-matmul-w8a8_CorrectnessTest'
+    label: 'Correctness tests for all-gather-matmul-w8a8'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w8a8_CorrectnessTest" "to be added"
+  - key: 'record_all-gather-matmul-w8a8_CorrectnessTest'
+    label: 'Record correctness test result for all-gather-matmul-w8a8'
+    depends_on: 'all-gather-matmul-w8a8_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'all-gather-matmul-w8a8'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w8a8_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'all-gather-matmul-w8a8_PerformanceTest'
+    label: 'Performance tests for all-gather-matmul-w8a8'
+    depends_on: 'record_all-gather-matmul-w8a8_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "all-gather-matmul-w8a8_PerformanceTest" "to be added"
+  - key: 'record_all-gather-matmul-w8a8_PerformanceTest'
+    label: 'Record performance test result for all-gather-matmul-w8a8'
+    depends_on: 'all-gather-matmul-w8a8_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'all-gather-matmul-w8a8'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh all-gather-matmul-w8a8_PerformanceTest
@@ -0,0 +1,46 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: attention_kernels-w16a16
+# Naming: for attention kernels, W[x]A[y] means KV cache (W) at x-bit and compute (A) at y-bit precision; here w16a16.
+steps:
+  - key: 'attention_kernels-w16a16_CorrectnessTest'
+    label: 'Correctness tests for attention kernels-w16a16'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "attention_kernels-w16a16_CorrectnessTest" "to be added"
+  - key: 'record_attention_kernels-w16a16_CorrectnessTest'
+    label: 'Record correctness test result for attention kernels-w16a16'
+    depends_on: 'attention_kernels-w16a16_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'attention_kernels-w16a16'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh attention_kernels-w16a16_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'attention_kernels-w16a16_PerformanceTest'
+    label: 'Performance tests for attention kernels-w16a16'
+    depends_on: 'record_attention_kernels-w16a16_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "attention_kernels-w16a16_PerformanceTest" "to be added"
+  - key: 'record_attention_kernels-w16a16_PerformanceTest'
+    label: 'Record performance test result for attention kernels-w16a16'
+    depends_on: 'attention_kernels-w16a16_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'attention_kernels-w16a16'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh attention_kernels-w16a16_PerformanceTest
@@ -0,0 +1,46 @@
+# Buildkite pipeline - kernel support matrix microbenchmarks
+# Target: attention_kernels-w4a16
+# Naming: for attention kernels, W[x]A[y] means KV cache (W) at x-bit and compute (A) at y-bit precision; here w4a16.
+steps:
+  - key: 'attention_kernels-w4a16_CorrectnessTest'
+    label: 'Correctness tests for attention kernels-w4a16'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "attention_kernels-w4a16_CorrectnessTest" "to be added"
+  - key: 'record_attention_kernels-w4a16_CorrectnessTest'
+    label: 'Record correctness test result for attention kernels-w4a16'
+    depends_on: 'attention_kernels-w4a16_CorrectnessTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'CorrectnessTest'
+      CI_TARGET: 'attention_kernels-w4a16'
+    commands:  # passes the key of the correctness step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh attention_kernels-w4a16_CorrectnessTest
+  # Performance stage: waits for the correctness record step above.
+  - key: 'attention_kernels-w4a16_PerformanceTest'
+    label: 'Performance tests for attention kernels-w4a16'
+    depends_on: 'record_attention_kernels-w4a16_CorrectnessTest'
+    agents:
+      queue: tpu_v6e_queue
+    soft_fail: true  # any non-zero exit status counts as a soft failure
+    commands:  # placeholder: only sets build meta-data for this step key
+      - |
+        buildkite-agent meta-data set "attention_kernels-w4a16_PerformanceTest" "to be added"
+  - key: 'record_attention_kernels-w4a16_PerformanceTest'
+    label: 'Record performance test result for attention kernels-w4a16'
+    depends_on: 'attention_kernels-w4a16_PerformanceTest'
+    agents:
+      queue: cpu
+    env:
+      CI_CATEGORY: 'kernel support matrix microbenchmarks'
+      CI_STAGE: 'PerformanceTest'
+      CI_TARGET: 'attention_kernels-w4a16'
+    commands:  # passes the key of the performance step to the record script
+      - |
+        .buildkite/scripts/record_step_result.sh attention_kernels-w4a16_PerformanceTest