mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 10:26:11 +08:00
[KV offload][1b/N] rename offloading to kv_offload (#25191)
Signed-off-by: Or Ozeri <oro@il.ibm.com>
This commit is contained in:
parent
1c3dad22ff
commit
a53ad626d6
@@ -280,7 +280,7 @@ steps:
|
|||||||
# split the test to avoid interference
|
# split the test to avoid interference
|
||||||
- pytest -v -s v1/core
|
- pytest -v -s v1/core
|
||||||
- pytest -v -s v1/executor
|
- pytest -v -s v1/executor
|
||||||
- pytest -v -s v1/offloading
|
- pytest -v -s v1/kv_offload
|
||||||
- pytest -v -s v1/sample
|
- pytest -v -s v1/sample
|
||||||
- pytest -v -s v1/logits_processors
|
- pytest -v -s v1/logits_processors
|
||||||
- pytest -v -s v1/worker
|
- pytest -v -s v1/worker
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
# SPDX-License-Identifier: Apache-2.0
|
# SPDX-License-Identifier: Apache-2.0
|
||||||
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
||||||
from vllm.v1.offloading.abstract import LoadStoreSpec
|
from vllm.v1.kv_offload.abstract import LoadStoreSpec
|
||||||
from vllm.v1.offloading.worker.worker import (OffloadingHandler,
|
from vllm.v1.kv_offload.worker.worker import (OffloadingHandler,
|
||||||
OffloadingWorker, TransferResult,
|
OffloadingWorker, TransferResult,
|
||||||
TransferSpec)
|
TransferSpec)
|
||||||
|
|
||||||
@@ -4,7 +4,7 @@ from abc import ABC
|
|||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
|
|
||||||
from vllm.v1.offloading.abstract import LoadStoreSpec
|
from vllm.v1.kv_offload.abstract import LoadStoreSpec
|
||||||
|
|
||||||
|
|
||||||
class BlockIDsLoadStoreSpec(LoadStoreSpec, ABC):
|
class BlockIDsLoadStoreSpec(LoadStoreSpec, ABC):
|
||||||
@@ -3,7 +3,7 @@
|
|||||||
from abc import ABC, abstractmethod
|
from abc import ABC, abstractmethod
|
||||||
|
|
||||||
from vllm.logger import init_logger
|
from vllm.logger import init_logger
|
||||||
from vllm.v1.offloading.abstract import LoadStoreSpec
|
from vllm.v1.kv_offload.abstract import LoadStoreSpec
|
||||||
|
|
||||||
# a single transfer spec (src_blocks_spec, dst_blocks_spec)
|
# a single transfer spec (src_blocks_spec, dst_blocks_spec)
|
||||||
TransferSpec = tuple[LoadStoreSpec, LoadStoreSpec]
|
TransferSpec = tuple[LoadStoreSpec, LoadStoreSpec]
|
||||||
Loading…
x
Reference in New Issue
Block a user