Skip to content

Commit 3f298b9

Browse files
committed
add new kernel and quantization support matrices (#1275)
Signed-off-by: Teresa Chen <[email protected]>
1 parent 8f30493 commit 3f298b9

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

47 files changed

+2055
-20
lines changed
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w16a16
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w16a16"
5+
key: "all-gather-matmul-w16a16_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w16a16_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w16a16"
13+
key: "record_all-gather-matmul-w16a16_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w16a16_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w16a16"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w16a16_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w16a16"
26+
key: "all-gather-matmul-w16a16_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w16a16_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w16a16_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w16a16"
35+
key: "record_all-gather-matmul-w16a16_PerformanceTest"
36+
depends_on: "all-gather-matmul-w16a16_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w16a16"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w16a16_PerformanceTest
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w4a16
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w4a16"
5+
key: "all-gather-matmul-w4a16_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w4a16_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w4a16"
13+
key: "record_all-gather-matmul-w4a16_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w4a16_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w4a16"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a16_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w4a16"
26+
key: "all-gather-matmul-w4a16_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w4a16_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w4a16_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w4a16"
35+
key: "record_all-gather-matmul-w4a16_PerformanceTest"
36+
depends_on: "all-gather-matmul-w4a16_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w4a16"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a16_PerformanceTest
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w4a4
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w4a4"
5+
key: "all-gather-matmul-w4a4_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w4a4_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w4a4"
13+
key: "record_all-gather-matmul-w4a4_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w4a4_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w4a4"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a4_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w4a4"
26+
key: "all-gather-matmul-w4a4_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w4a4_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w4a4_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w4a4"
35+
key: "record_all-gather-matmul-w4a4_PerformanceTest"
36+
depends_on: "all-gather-matmul-w4a4_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w4a4"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a4_PerformanceTest
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w4a8
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w4a8"
5+
key: "all-gather-matmul-w4a8_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w4a8_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w4a8"
13+
key: "record_all-gather-matmul-w4a8_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w4a8_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w4a8"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a8_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w4a8"
26+
key: "all-gather-matmul-w4a8_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w4a8_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w4a8_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w4a8"
35+
key: "record_all-gather-matmul-w4a8_PerformanceTest"
36+
depends_on: "all-gather-matmul-w4a8_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w4a8"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w4a8_PerformanceTest
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w8a16
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w8a16"
5+
key: "all-gather-matmul-w8a16_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w8a16_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w8a16"
13+
key: "record_all-gather-matmul-w8a16_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w8a16_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w8a16"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w8a16_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w8a16"
26+
key: "all-gather-matmul-w8a16_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w8a16_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w8a16_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w8a16"
35+
key: "record_all-gather-matmul-w8a16_PerformanceTest"
36+
depends_on: "all-gather-matmul-w8a16_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w8a16"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w8a16_PerformanceTest
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
# all-gather-matmul-w8a8
2+
# kernel support matrix microbenchmarks
3+
steps:
4+
- label: "Correctness tests for all-gather-matmul-w8a8"
5+
key: "all-gather-matmul-w8a8_CorrectnessTest"
6+
soft_fail: true
7+
agents:
8+
queue: tpu_v6e_queue
9+
commands:
10+
- |
11+
buildkite-agent meta-data set "all-gather-matmul-w8a8_CorrectnessTest" "to be added"
12+
- label: "Record correctness test result for all-gather-matmul-w8a8"
13+
key: "record_all-gather-matmul-w8a8_CorrectnessTest"
14+
depends_on: "all-gather-matmul-w8a8_CorrectnessTest"
15+
env:
16+
CI_TARGET: "all-gather-matmul-w8a8"
17+
CI_STAGE: "CorrectnessTest"
18+
CI_CATEGORY: "kernel support matrix microbenchmarks"
19+
agents:
20+
queue: cpu
21+
commands:
22+
- |
23+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w8a8_CorrectnessTest
24+
25+
- label: "Performance tests for all-gather-matmul-w8a8"
26+
key: "all-gather-matmul-w8a8_PerformanceTest"
27+
depends_on: "record_all-gather-matmul-w8a8_CorrectnessTest"
28+
soft_fail: true
29+
agents:
30+
queue: tpu_v6e_queue
31+
commands:
32+
- |
33+
buildkite-agent meta-data set "all-gather-matmul-w8a8_PerformanceTest" "to be added"
34+
- label: "Record performance test result for all-gather-matmul-w8a8"
35+
key: "record_all-gather-matmul-w8a8_PerformanceTest"
36+
depends_on: "all-gather-matmul-w8a8_PerformanceTest"
37+
env:
38+
CI_TARGET: "all-gather-matmul-w8a8"
39+
CI_STAGE: "PerformanceTest"
40+
CI_CATEGORY: "kernel support matrix microbenchmarks"
41+
agents:
42+
queue: cpu
43+
commands:
44+
- |
45+
.buildkite/scripts/record_step_result.sh all-gather-matmul-w8a8_PerformanceTest
Lines changed: 46 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,46 @@
1+
# attention_kernels-w16a16
2+
# kernel support matrix microbenchmarks
3+
# For attention kernels, W[x]A[y] denotes the KV cache (W) and compute (A) precisions, where x and y are the respective bit widths; this file covers w16a16.
4+
steps:
5+
- label: "Correctness tests for attention kernels-w16a16"
6+
key: "attention_kernels-w16a16_CorrectnessTest"
7+
soft_fail: true
8+
agents:
9+
queue: tpu_v6e_queue
10+
commands:
11+
- |
12+
buildkite-agent meta-data set "attention_kernels-w16a16_CorrectnessTest" "to be added"
13+
- label: "Record correctness test result for attention kernels-w16a16"
14+
key: "record_attention_kernels-w16a16_CorrectnessTest"
15+
depends_on: "attention_kernels-w16a16_CorrectnessTest"
16+
env:
17+
CI_TARGET: "attention_kernels-w16a16"
18+
CI_STAGE: "CorrectnessTest"
19+
CI_CATEGORY: "kernel support matrix microbenchmarks"
20+
agents:
21+
queue: cpu
22+
commands:
23+
- |
24+
.buildkite/scripts/record_step_result.sh attention_kernels-w16a16_CorrectnessTest
25+
26+
- label: "Performance tests for attention kernels-w16a16"
27+
key: "attention_kernels-w16a16_PerformanceTest"
28+
depends_on: "record_attention_kernels-w16a16_CorrectnessTest"
29+
soft_fail: true
30+
agents:
31+
queue: tpu_v6e_queue
32+
commands:
33+
- |
34+
buildkite-agent meta-data set "attention_kernels-w16a16_PerformanceTest" "to be added"
35+
- label: "Record performance test result for attention kernels-w16a16"
36+
key: "record_attention_kernels-w16a16_PerformanceTest"
37+
depends_on: "attention_kernels-w16a16_PerformanceTest"
38+
env:
39+
CI_TARGET: "attention_kernels-w16a16"
40+
CI_STAGE: "PerformanceTest"
41+
CI_CATEGORY: "kernel support matrix microbenchmarks"
42+
agents:
43+
queue: cpu
44+
commands:
45+
- |
46+
.buildkite/scripts/record_step_result.sh attention_kernels-w16a16_PerformanceTest
Lines changed: 46 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,46 @@
1+
# attention_kernels-w4a16
2+
# kernel support matrix microbenchmarks
3+
# For attention kernels, W[x]A[y] denotes the KV cache (W) and compute (A) precisions, where x and y are the respective bit widths; this file covers w4a16.
4+
steps:
5+
- label: "Correctness tests for attention kernels-w4a16"
6+
key: "attention_kernels-w4a16_CorrectnessTest"
7+
soft_fail: true
8+
agents:
9+
queue: tpu_v6e_queue
10+
commands:
11+
- |
12+
buildkite-agent meta-data set "attention_kernels-w4a16_CorrectnessTest" "to be added"
13+
- label: "Record correctness test result for attention kernels-w4a16"
14+
key: "record_attention_kernels-w4a16_CorrectnessTest"
15+
depends_on: "attention_kernels-w4a16_CorrectnessTest"
16+
env:
17+
CI_TARGET: "attention_kernels-w4a16"
18+
CI_STAGE: "CorrectnessTest"
19+
CI_CATEGORY: "kernel support matrix microbenchmarks"
20+
agents:
21+
queue: cpu
22+
commands:
23+
- |
24+
.buildkite/scripts/record_step_result.sh attention_kernels-w4a16_CorrectnessTest
25+
26+
- label: "Performance tests for attention kernels-w4a16"
27+
key: "attention_kernels-w4a16_PerformanceTest"
28+
depends_on: "record_attention_kernels-w4a16_CorrectnessTest"
29+
soft_fail: true
30+
agents:
31+
queue: tpu_v6e_queue
32+
commands:
33+
- |
34+
buildkite-agent meta-data set "attention_kernels-w4a16_PerformanceTest" "to be added"
35+
- label: "Record performance test result for attention kernels-w4a16"
36+
key: "record_attention_kernels-w4a16_PerformanceTest"
37+
depends_on: "attention_kernels-w4a16_PerformanceTest"
38+
env:
39+
CI_TARGET: "attention_kernels-w4a16"
40+
CI_STAGE: "PerformanceTest"
41+
CI_CATEGORY: "kernel support matrix microbenchmarks"
42+
agents:
43+
queue: cpu
44+
commands:
45+
- |
46+
.buildkite/scripts/record_step_result.sh attention_kernels-w4a16_PerformanceTest

0 commit comments

Comments
 (0)