Skip to content

Commit b7302c6

Browse files
authored
[nightly ut] reduce memory usage and skip deepseek on machines without avx512_bf16 support (#3664)
1 parent 03cb4d8 commit b7302c6

File tree

2 files changed

+7
-2
lines changed

2 files changed

+7
-2
lines changed

tests/cpu/hf_configs/mllama/config.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@
 39  39    "forced_bos_token_id": null,
 40  40    "forced_eos_token_id": null,
 41  41    "hidden_act": "silu",
 42      - "hidden_size": 4096,
     42  + "hidden_size": 1024,
 43  43    "id2label": {
 44  44    "0": "LABEL_0",
 45  45    "1": "LABEL_1"

tests/cpu/test_ipex_optimize_transformers_nightly.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -302,7 +302,7 @@ def model_replacement_check(
302 302   elif m.name == "jamba":
303 303   model.config.dtype = dtype
304 304   model.eval()
305     - ref_m = copy.deepcopy(model)
    305 + ref_m = model
306 306   ipex_m = copy.deepcopy(model)
307 307   ipex_m = ipex.llm.optimize(
308 308   ipex_m, dtype=dtype, deployment_mode=deployment_mode, inplace=True
@@ -428,6 +428,11 @@ def test_model_replacement(self):
428 428   ):
429 429   if torchcompile and deployment_mode:
430 430   continue
    431 + if (
    432 + m.name in ["deepseekv2", "deepseekv3"]
    433 + and not core.isa_has_avx512_bf16_support()
    434 + ):
    435 + continue
431 436   self.model_replacement_check(m, dtype, jit, torchcompile, ret_dict)
432 437   _disable_tpp()
433 438

0 commit comments

Comments
 (0)