mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-09 07:14:58 +08:00
72 lines
2.4 KiB
Python
72 lines
2.4 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
import pytest
|
|
|
|
from vllm.engine.arg_utils import EngineArgs
|
|
from vllm.model_executor.layers.quantization.quark.utils import deep_compare
|
|
|
|
|
|
def test_cuda_empty_vs_unset_configs(monkeypatch: pytest.MonkeyPatch):
|
|
"""Test that configs created with normal (untouched) CUDA_VISIBLE_DEVICES
|
|
and CUDA_VISIBLE_DEVICES="" are equivalent. This ensures consistent
|
|
behavior regardless of whether GPU visibility is disabled via empty string
|
|
or left in its normal state.
|
|
"""
|
|
|
|
def create_config():
|
|
engine_args = EngineArgs(model="deepseek-ai/DeepSeek-V2-Lite",
|
|
trust_remote_code=True)
|
|
return engine_args.create_engine_config()
|
|
|
|
# Create config with CUDA_VISIBLE_DEVICES set normally
|
|
normal_config = create_config()
|
|
|
|
# Create config with CUDA_VISIBLE_DEVICES=""
|
|
with monkeypatch.context() as m:
|
|
m.setenv("CUDA_VISIBLE_DEVICES", "")
|
|
empty_config = create_config()
|
|
|
|
normal_config_dict = vars(normal_config)
|
|
empty_config_dict = vars(empty_config)
|
|
|
|
# Remove instance_id before comparison as it's expected to be different
|
|
normal_config_dict.pop("instance_id", None)
|
|
empty_config_dict.pop("instance_id", None)
|
|
|
|
assert deep_compare(normal_config_dict, empty_config_dict), (
|
|
"Configs with normal CUDA_VISIBLE_DEVICES and CUDA_VISIBLE_DEVICES=\"\""
|
|
" should be equivalent")
|
|
|
|
|
|
def test_ray_runtime_env(monkeypatch: pytest.MonkeyPatch):
|
|
# In testing, this method needs to be nested inside as ray does not
|
|
# see the test module.
|
|
def create_config():
|
|
engine_args = EngineArgs(model="deepseek-ai/DeepSeek-V2-Lite",
|
|
trust_remote_code=True)
|
|
return engine_args.create_engine_config()
|
|
|
|
config = create_config()
|
|
parallel_config = config.parallel_config
|
|
assert parallel_config.ray_runtime_env is None
|
|
|
|
import ray
|
|
ray.init()
|
|
|
|
runtime_env = {
|
|
"env_vars": {
|
|
"TEST_ENV_VAR": "test_value",
|
|
},
|
|
}
|
|
|
|
config_ref = ray.remote(create_config).options(
|
|
runtime_env=runtime_env).remote()
|
|
|
|
config = ray.get(config_ref)
|
|
parallel_config = config.parallel_config
|
|
assert parallel_config.ray_runtime_env is not None
|
|
assert parallel_config.ray_runtime_env.env_vars().get(
|
|
"TEST_ENV_VAR") == "test_value"
|
|
|
|
ray.shutdown()
|