Skip to content

Commit 454583c

Browse files
committed
update acc (accuracy test cases: add gsm8k case, raise AIME baseline, add nightly job)
Signed-off-by: jiangyunfan1 <jiangyunfan1@h-partners.com>
1 parent cbb27fe commit 454583c

File tree

2 files changed

+33
-2
lines changed

2 files changed

+33
-2
lines changed

.github/workflows/vllm_ascend_test_nightly_a3.yaml

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -141,3 +141,20 @@ jobs:
141141
image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-a3'
142142
tests: ${{ matrix.test_config.tests }}
143143
name: ${{ matrix.test_config.name }}
144+
145+
single-node-tests2:
146+
name: single-node
147+
strategy:
148+
fail-fast: false
149+
matrix:
150+
test_config:
151+
- name: deepseek-r1-w8a8-mtpx
152+
os: linux-aarch64-a3-16
153+
tests: tests/e2e/nightly/features/test_mtpx_deepseek_r1_0528_w8a8.py
154+
uses: ./.github/workflows/_e2e_nightly_single_node.yaml
155+
with:
156+
vllm: v0.11.0
157+
runner: ${{ matrix.test_config.os }}
158+
image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-a3'
159+
tests: ${{ matrix.test_config.tests }}
160+
name: ${{ matrix.test_config.name }}

tests/e2e/nightly/features/test_mtpx_deepseek_r1_0528_w8a8.py

Lines changed: 16 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -38,17 +38,30 @@
3838
"max_tokens": 10,
3939
}
4040

41-
aisbench_cases = [{
41+
aisbench_gsm8k = [{
42+
"case_type": "accuracy",
43+
"dataset_path": "vllm-ascend/gsm8k-lite",
44+
"request_conf": "vllm_api_general_chat",
45+
"dataset_conf": "gsm8k/gsm8k_gen_0_shot_noncot_chat_prompt",
46+
"max_out_len": 32768,
47+
"batch_size": 32,
48+
"baseline": 95,
49+
"threshold": 5
50+
}]
51+
52+
aisbench_aime = [{
4253
"case_type": "accuracy",
4354
"dataset_path": "vllm-ascend/aime2024",
4455
"request_conf": "vllm_api_general_chat",
4556
"dataset_conf": "aime2024/aime2024_gen_0_shot_chat_prompt",
4657
"max_out_len": 32768,
4758
"batch_size": 32,
48-
"baseline": 80,
59+
"baseline": 86.67,
4960
"threshold": 7
5061
}]
5162

63+
aisbench_case_dict = {"mtp2": aisbench_gsm8k, "mtp3": aisbench_aime}
64+
5265

5366
@pytest.mark.asyncio
5467
@pytest.mark.parametrize("model", MODELS)
@@ -132,6 +145,7 @@ async def test_models(model: str, mode: str) -> None:
132145
assert choices[0].text, "empty response"
133146
print(choices)
134147
# aisbench test
148+
aisbench_cases = aisbench_case_dict[mode]
135149
run_aisbench_cases(model,
136150
port,
137151
aisbench_cases,

0 commit comments

Comments
 (0)