Skip to content

Commit 0bcc518

Browse files
committed
testing
1 parent b50dd01 commit 0bcc518

File tree

6 files changed

+3521
-3405
lines changed

6 files changed

+3521
-3405
lines changed

log-fp4.log

Lines changed: 271 additions & 279 deletions
Large diffs are not rendered by default.

log-int4.log

Lines changed: 3244 additions & 3120 deletions
Large diffs are not rendered by default.

run.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -7,8 +7,8 @@
77
export TEST_DATA_FILE="${REPOS}/llm-compressor/tests/e2e/vLLM/configs/w4a16_channel_quant_moe.yaml"
88
pytest tests/e2e/vLLM/test_vllm.py -vs 2>&1 | tee log-int4.log
99

10-
export TEST_DATA_FILE="${REPOS}/llm-compressor/tests/e2e/vLLM/configs/fp4_nvfp4_moe.yaml"
11-
pytest tests/e2e/vLLM/test_vllm.py -vs 2>&1 | tee log-fp4.log
10+
# export TEST_DATA_FILE="${REPOS}/llm-compressor/tests/e2e/vLLM/configs/fp4_nvfp4_moe.yaml"
11+
# pytest tests/e2e/vLLM/test_vllm.py -vs 2>&1 | tee log-fp4.log
1212

1313

1414

tests/e2e/e2e_utils.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -77,7 +77,7 @@ def data_collator(batch):
7777
}
7878

7979
oneshot_kwargs["data_collator"] = data_collator
80-
80+
print("CDH", recipe, scheme)
8181
oneshot_kwargs["model"] = loaded_model
8282
if recipe:
8383
oneshot_kwargs["recipe"] = recipe

tests/e2e/vLLM/configs/w4a16_channel_quant_moe.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,9 +2,9 @@ cadence: "nightly"
22
test_type: "regression"
33
model: Qwen/Qwen3-VL-30B-A3B-Instruct
44
model_class: "Qwen3VLMoeForConditionalGeneration"
5-
scheme: W4A16
5+
# scheme: W4A16
66
num_calibration_samples: 20
77
dataset_id: neuralmagic/calibration
88
dataset_split: train
99
dataset_config: LLM
10-
quant_type: "GPTQ"
10+
recipe: "tests/e2e/vLLM/recipes/WNA16/recipe_w4a16_gptq.yaml"

tests/e2e/vLLM/run_vllm.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ def parse_args():
1818
except json.JSONDecodeError as e:
1919
raise ValueError(f"Invalid JSON input: {e}")
2020

21-
if "W4A16_2of4" in scheme:
21+
if scheme is not None and "W4A16_2of4" in scheme:
2222
# required by the kernel
2323
llm_kwargs["dtype"] = torch.float16
2424

0 commit comments

Comments
 (0)