mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-05 07:55:40 +08:00
[Bugfix] fix type hint for py 3.8 (#4036)
This commit is contained in:
parent
36729bac13
commit
96b6a6d790
@ -1,5 +1,5 @@
|
|||||||
from abc import ABC, abstractmethod
|
from abc import ABC, abstractmethod
|
||||||
from typing import Dict, List, Optional
|
from typing import Dict, List, Optional, Tuple
|
||||||
|
|
||||||
from vllm.config import (CacheConfig, DeviceConfig, LoRAConfig, ModelConfig,
|
from vllm.config import (CacheConfig, DeviceConfig, LoRAConfig, ModelConfig,
|
||||||
ParallelConfig, SchedulerConfig, SpeculativeConfig,
|
ParallelConfig, SchedulerConfig, SpeculativeConfig,
|
||||||
@ -31,7 +31,7 @@ class ExecutorBase(ABC):
|
|||||||
raise NotImplementedError
|
raise NotImplementedError
|
||||||
|
|
||||||
@abstractmethod
|
@abstractmethod
|
||||||
def determine_num_available_blocks(self) -> tuple[int, int]:
|
def determine_num_available_blocks(self) -> Tuple[int, int]:
|
||||||
"""Determine the number of available blocks for the GPU KV cache and
|
"""Determine the number of available blocks for the GPU KV cache and
|
||||||
swappable CPU KV cache.
|
swappable CPU KV cache.
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user