mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
76 lines
2.4 KiB
Python
76 lines
2.4 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
import pytest
|
|
|
|
from vllm.engine.arg_utils import EngineArgs
|
|
from vllm.model_executor.layers.quantization.quark.utils import deep_compare
|
|
|
|
|
|
def test_cuda_empty_vs_unset_configs(monkeypatch: pytest.MonkeyPatch):
|
|
"""Test that configs created with normal (untouched) CUDA_VISIBLE_DEVICES
|
|
and CUDA_VISIBLE_DEVICES="" are equivalent. This ensures consistent
|
|
behavior regardless of whether GPU visibility is disabled via empty string
|
|
or left in its normal state.
|
|
"""
|
|
|
|
def create_config():
|
|
engine_args = EngineArgs(
|
|
model="deepseek-ai/DeepSeek-V2-Lite", trust_remote_code=True
|
|
)
|
|
return engine_args.create_engine_config()
|
|
|
|
# Create config with CUDA_VISIBLE_DEVICES set normally
|
|
normal_config = create_config()
|
|
|
|
# Create config with CUDA_VISIBLE_DEVICES=""
|
|
with monkeypatch.context() as m:
|
|
m.setenv("CUDA_VISIBLE_DEVICES", "")
|
|
empty_config = create_config()
|
|
|
|
normal_config_dict = vars(normal_config)
|
|
empty_config_dict = vars(empty_config)
|
|
|
|
# Remove instance_id before comparison as it's expected to be different
|
|
normal_config_dict.pop("instance_id", None)
|
|
empty_config_dict.pop("instance_id", None)
|
|
|
|
assert deep_compare(normal_config_dict, empty_config_dict), (
|
|
'Configs with normal CUDA_VISIBLE_DEVICES and CUDA_VISIBLE_DEVICES=""'
|
|
" should be equivalent"
|
|
)
|
|
|
|
|
|
def test_ray_runtime_env(monkeypatch: pytest.MonkeyPatch):
|
|
# In testing, this method needs to be nested inside as ray does not
|
|
# see the test module.
|
|
def create_config():
|
|
engine_args = EngineArgs(
|
|
model="deepseek-ai/DeepSeek-V2-Lite", trust_remote_code=True
|
|
)
|
|
return engine_args.create_engine_config()
|
|
|
|
config = create_config()
|
|
parallel_config = config.parallel_config
|
|
assert parallel_config.ray_runtime_env is None
|
|
|
|
import ray
|
|
|
|
ray.init()
|
|
|
|
runtime_env = {
|
|
"env_vars": {
|
|
"TEST_ENV_VAR": "test_value",
|
|
},
|
|
}
|
|
|
|
config_ref = ray.remote(create_config).options(runtime_env=runtime_env).remote()
|
|
|
|
config = ray.get(config_ref)
|
|
parallel_config = config.parallel_config
|
|
assert parallel_config.ray_runtime_env is not None
|
|
assert (
|
|
parallel_config.ray_runtime_env.env_vars().get("TEST_ENV_VAR") == "test_value"
|
|
)
|
|
|
|
ray.shutdown()
|