mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-23 14:17:59 +08:00
[CI/Build] Skip cpu offloading test on AMD (#27690)
Signed-off-by: zhewenli <zhewenli@meta.com>
This commit is contained in:
parent
ad3ec89532
commit
9a0d2f0d92
@@ -12,6 +12,7 @@ from tqdm import tqdm
|
|||||||
from vllm import LLM, SamplingParams, TokensPrompt
|
from vllm import LLM, SamplingParams, TokensPrompt
|
||||||
from vllm.config import KVEventsConfig, KVTransferConfig
|
from vllm.config import KVEventsConfig, KVTransferConfig
|
||||||
from vllm.distributed.kv_events import BlockStored, KVEventBatch
|
from vllm.distributed.kv_events import BlockStored, KVEventBatch
|
||||||
|
from vllm.platforms import current_platform
|
||||||
|
|
||||||
CPU_BLOCK_SIZES = [16, 48]
|
CPU_BLOCK_SIZES = [16, 48]
|
||||||
|
|
||||||
@@ -63,6 +64,9 @@ class MockSubscriber:
|
|||||||
self.sub.close()
|
self.sub.close()
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skipif(
|
||||||
|
not current_platform.is_cuda(), reason="CPU offloading only supported on CUDA"
|
||||||
|
)
|
||||||
@pytest.mark.parametrize("cpu_block_size", CPU_BLOCK_SIZES)
|
@pytest.mark.parametrize("cpu_block_size", CPU_BLOCK_SIZES)
|
||||||
def test_cpu_offloading(cpu_block_size: int) -> None:
|
def test_cpu_offloading(cpu_block_size: int) -> None:
|
||||||
"""
|
"""
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user