Skip to content

Commit 7ccd6c5

Browse files
authored
Introduce cpu agents for general-purpose tasks that don't require TPU (#1012)
Signed-off-by: Johnny Yang <johnnyyang@google.com>
1 parent 92f94be commit 7ccd6c5

25 files changed

+64
-65
lines changed

.buildkite/features/Chunked_Prefill.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Chunked Prefill"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Chunked_Prefill_CorrectnessTest
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: "Chunked Prefill"
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Chunked_Prefill_PerformanceTest

.buildkite/features/Collective_Communication_Matmul.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Collective Communication Matmul"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Collective_Communication_Matmul_CorrectnessTest

.buildkite/features/JAX-Path_Qxix_Quantization.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "JAX-Path Qxix Quantization"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh JAX-Path_Qxix_Quantization_CorrectnessTest
@@ -36,7 +36,7 @@ steps:
3636
CI_TARGET: "JAX-Path Qxix Quantization"
3737
CI_STAGE: "PerformanceTest"
3838
agents:
39-
queue: tpu_v6e_queue
39+
queue: cpu
4040
commands:
4141
- |
4242
.buildkite/scripts/record_step_result.sh JAX-Path_Qxix_Quantization_PerformanceTest

.buildkite/features/Multimodal_Inputs.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: Multimodal Inputs
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Multimodal_Inputs_CorrectnessTest
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: Multimodal Inputs
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Multimodal_Inputs_PerformanceTest

.buildkite/features/Prefix_Caching.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ steps:
44
key: "Prefix_Caching_CorrectnessTest"
55
soft_fail: true
66
agents:
7-
queue: tpu_v6e_queue
7+
queue: cpu
88
commands:
99
- echo "default on in vLLM"
1010
- label: "Record correctness test result for Prefix Caching"
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Prefix Caching"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Prefix_Caching_CorrectnessTest
@@ -24,7 +24,7 @@ steps:
2424
depends_on: "record_Prefix_Caching_CorrectnessTest"
2525
soft_fail: true
2626
agents:
27-
queue: tpu_v6e_queue
27+
queue: cpu
2828
commands:
2929
- echo "default on in vLLM"
3030
- label: "Record performance test result for Prefix Caching"
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: "Prefix Caching"
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Prefix_Caching_PerformanceTest

.buildkite/features/Quantized_Matmul_Attention_and_KV_Cache.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ steps:
44
key: "Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest"
55
soft_fail: true
66
agents:
7-
queue: tpu_v6e_queue
7+
queue: cpu
88
commands:
99
- echo "covered by performance test"
1010
- label: "Record correctness test result for Quantized Matmul Attention and KV Cache"
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Quantized Matmul Attention and KV Cache"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Quantized_Matmul_Attention_and_KV_Cache_CorrectnessTest
@@ -45,7 +45,7 @@ steps:
4545
CI_TARGET: "Quantized Matmul Attention and KV Cache"
4646
CI_STAGE: "PerformanceTest"
4747
agents:
48-
queue: tpu_v6e_queue
48+
queue: cpu
4949
commands:
5050
- |
5151
.buildkite/scripts/record_step_result.sh Quantized_Matmul_Attention_and_KV_Cache_PerformanceTest

.buildkite/features/Ragged_Paged_Attention_V3.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ steps:
44
key: "Ragged_Paged_Attention_V3_CorrectnessTest"
55
soft_fail: true
66
agents:
7-
queue: tpu_v6e_queue
7+
queue: cpu
88
commands:
99
- echo "default on in vLLM"
1010
- label: "Record correctness test result for Ragged Paged Attention V3"
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Ragged Paged Attention V3"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Ragged_Paged_Attention_V3_CorrectnessTest
@@ -24,7 +24,7 @@ steps:
2424
depends_on: "record_Ragged_Paged_Attention_V3_CorrectnessTest"
2525
soft_fail: true
2626
agents:
27-
queue: tpu_v6e_queue
27+
queue: cpu
2828
commands:
2929
- echo "default on in vLLM"
3030
- label: "Record performance test result for Ragged Paged Attention V3"
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: "Ragged Paged Attention V3"
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Ragged_Paged_Attention_V3_PerformanceTest

.buildkite/features/Single_Program_Multi_Data.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ steps:
44
key: "Single_Program_Multi_Data__CorrectnessTest"
55
soft_fail: true
66
agents:
7-
queue: tpu_v6e_queue
7+
queue: cpu
88
commands:
99
- echo "default on in vLLM"
1010
- label: "Record correctness test result for Single Program Multi Data"
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Single Program Multi Data"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Single_Program_Multi_Data__CorrectnessTest
@@ -24,7 +24,7 @@ steps:
2424
depends_on: "record_Single_Program_Multi_Data__CorrectnessTest"
2525
soft_fail: true
2626
agents:
27-
queue: tpu_v6e_queue
27+
queue: cpu
2828
commands:
2929
- echo "default on in vLLM"
3030
- label: "Record performance test result for Single Program Multi Data"
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: "Single Program Multi Data"
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Single_Program_Multi_Data__PerformanceTest

.buildkite/features/Speculative_Decoding-_Ngram.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ steps:
44
key: "Speculative_Decoding-_Ngram_CorrectnessTest"
55
soft_fail: true
66
agents:
7-
queue: tpu_v6e_queue
7+
queue: cpu
88
commands:
99
- echo "covered by performance test"
1010
- label: "Record correctness test result for Speculative Decoding: Ngram"
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: "Speculative Decoding: Ngram"
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Speculative_Decoding-_Ngram_CorrectnessTest
@@ -24,7 +24,7 @@ steps:
2424
depends_on: "record_Speculative_Decoding-_Ngram_CorrectnessTest"
2525
soft_fail: true
2626
agents:
27-
queue: tpu_v6e_queue
27+
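queue: tpu_v6e_queue  # NOTE(review): this step runs the e2e speculative-decoding pytest via run_in_docker.sh, not an echo/record task; it presumably needs a TPU, so keep it on the TPU queue unless confirmed otherwise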
2828
commands:
2929
- .buildkite/scripts/run_in_docker.sh python3 -m pytest -s -v /workspace/tpu_inference/tests/e2e/test_speculative_decoding.py
3030
- label: "Record performance test result for Speculative Decoding: Ngram"
@@ -34,7 +34,7 @@ steps:
3434
CI_TARGET: "Speculative Decoding: Ngram"
3535
CI_STAGE: "PerformanceTest"
3636
agents:
37-
queue: tpu_v6e_queue
37+
queue: cpu
3838
commands:
3939
- |
4040
.buildkite/scripts/record_step_result.sh Speculative_Decoding-_Ngram_PerformanceTest

.buildkite/features/Structured_Decoding.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ steps:
1414
CI_TARGET: Structured Decoding
1515
CI_STAGE: "CorrectnessTest"
1616
agents:
17-
queue: tpu_v6e_queue
17+
queue: cpu
1818
commands:
1919
- |
2020
.buildkite/scripts/record_step_result.sh Structured_Decoding_CorrectnessTest

0 commit comments

Comments
 (0)