mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-23 15:04:32 +08:00
Bump arctic-inference requirement (#28174)
Co-authored-by: Aurick Qiao <aurick.qiao@snowflake.com>
Co-authored-by: Wentao Ye <44945378+yewentao256@users.noreply.github.com>
This commit is contained in:
parent
0852527647
commit
781f5ebf52
@@ -48,7 +48,7 @@ buildkite-test-collector==0.1.9
|
||||
genai_perf==0.0.8
|
||||
tritonclient==2.51.0
|
||||
|
||||
- arctic-inference == 0.1.0 # Required for suffix decoding test
|
||||
+ arctic-inference == 0.1.1 # Required for suffix decoding test
|
||||
numba == 0.61.2 # Required for N-gram speculative decoding
|
||||
numpy
|
||||
runai-model-streamer[s3,gcs]==0.15.0
|
||||
|
||||
@@ -40,7 +40,7 @@ anyio==4.6.2.post1
|
||||
# via
|
||||
# httpx
|
||||
# starlette
|
||||
- arctic-inference==0.1.0
|
||||
+ arctic-inference==0.1.1
|
||||
# via -r requirements/test.in
|
||||
argcomplete==3.5.1
|
||||
# via datamodel-code-generator
|
||||
|
||||
@@ -469,7 +469,7 @@ class SpeculativeConfig:
|
||||
if not has_arctic_inference():
|
||||
raise ImportError(
|
||||
"Arctic Inference is required for suffix decoding. "
|
||||
- "Install via `pip install arctic-inference==0.1.0`."
|
||||
+ "Install via `pip install arctic-inference==0.1.1`."
|
||||
)
|
||||
if self.num_speculative_tokens is None:
|
||||
# Suffix decoding decides the actual number of speculative tokens
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user