[Bugfix] Add quantization param for multi-node CI (#3383)

### What this PR does / why we need it?
Add the `quantization` parameter (set to `"ascend"`) to both the leader and worker server configurations of the `deepseek-w8a8` multi-node test.
### Does this PR introduce _any_ user-facing change?

### How was this patch tested?

- vLLM version: v0.11.0rc3
- vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.0

Signed-off-by: wangli <wangli858794774@gmail.com>
This commit is contained in:
Li Wang
2025-10-11 19:25:16 +08:00
committed by GitHub
parent e8c871ed0a
commit 1b1207e3c3

View File

@@ -7,6 +7,7 @@
"server_parameters": {
"leader_config": {
"model": "vllm-ascend/DeepSeek-V3-W8A8",
"quantization": "ascend",
"additional_config": {
"ascend_scheduler_config": {
"enabled": true
@@ -18,6 +19,7 @@
},
"worker_config": {
"model": "vllm-ascend/DeepSeek-V3-W8A8",
"quantization": "ascend",
"additional_config": {
"ascend_scheduler_config": {
"enabled": true