[Bugfix] Add quantization param for multi-node CI (#3383)

### What this PR does / why we need it?

Add quantization param for `deepseek-w8a8` multi-node test

### Does this PR introduce _any_ user-facing change?

### How was this patch tested?

- vLLM version: v0.11.0rc3
- vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.0

Signed-off-by: wangli <wangli858794774@gmail.com>
2025-10-20 13:43:53 +08:00 · 2025-10-11 19:25:16 +08:00
parent e8c871ed0a
commit 1b1207e3c3
1 changed file with 2 additions and 0 deletions
--- a/tests/e2e/multi_node/config/config.json
+++ b/tests/e2e/multi_node/config/config.json
@@ -7,6 +7,7 @@
        "server_parameters": {
            "leader_config": {
                "model": "vllm-ascend/DeepSeek-V3-W8A8",
+                "quantization": "ascend",
                "additional_config": {
                    "ascend_scheduler_config": {
                        "enabled": true
@@ -18,6 +19,7 @@
            },
            "worker_config": {
                "model": "vllm-ascend/DeepSeek-V3-W8A8",
+                "quantization": "ascend",
                "additional_config": {
                    "ascend_scheduler_config": {
                        "enabled": true