Bump arctic-inference requirement (#28174)

Co-authored-by: Aurick Qiao <aurick.qiao@snowflake.com>
Co-authored-by: Wentao Ye <44945378+yewentao256@users.noreply.github.com>
This commit is contained in:
Aurick Qiao 2025-11-07 18:31:18 -08:00 committed by GitHub
parent 0852527647
commit 781f5ebf52
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 3 additions and 3 deletions

View File

@@ -48,7 +48,7 @@ buildkite-test-collector==0.1.9
genai_perf==0.0.8
tritonclient==2.51.0
-arctic-inference == 0.1.0 # Required for suffix decoding test
+arctic-inference == 0.1.1 # Required for suffix decoding test
numba == 0.61.2 # Required for N-gram speculative decoding
numpy
runai-model-streamer[s3,gcs]==0.15.0

View File

@@ -40,7 +40,7 @@ anyio==4.6.2.post1
# via
# httpx
# starlette
-arctic-inference==0.1.0
+arctic-inference==0.1.1
# via -r requirements/test.in
argcomplete==3.5.1
# via datamodel-code-generator

View File

@@ -469,7 +469,7 @@ class SpeculativeConfig:
if not has_arctic_inference():
raise ImportError(
"Arctic Inference is required for suffix decoding. "
-"Install via `pip install arctic-inference==0.1.0`."
+"Install via `pip install arctic-inference==0.1.1`."
)
if self.num_speculative_tokens is None:
# Suffix decoding decides the actual number of speculative tokens