Add more PyTorch-related tests for torch nightly (#17422)

Signed-off-by: Yang Wang <elainewy@meta.com>
This commit is contained in:
Yang Wang 2025-05-02 03:29:59 -07:00 committed by GitHub
parent d7543862bd
commit b8b0859b5c
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 14 additions and 4 deletions

View File

@@ -293,6 +293,7 @@ steps:
parallelism: 4 parallelism: 4
- label: PyTorch Compilation Unit Tests - label: PyTorch Compilation Unit Tests
torch_nightly: true
source_file_dependencies: source_file_dependencies:
- vllm/ - vllm/
- tests/compile - tests/compile
@@ -302,6 +303,7 @@ steps:
- pytest -v -s compile/test_sequence_parallelism.py - pytest -v -s compile/test_sequence_parallelism.py
- label: PyTorch Fullgraph Smoke Test # 9min - label: PyTorch Fullgraph Smoke Test # 9min
torch_nightly: true
source_file_dependencies: source_file_dependencies:
- vllm/ - vllm/
- tests/compile - tests/compile
@@ -312,6 +314,7 @@ steps:
- pytest -v -s compile/piecewise/test_toy_llama.py - pytest -v -s compile/piecewise/test_toy_llama.py
- label: PyTorch Fullgraph Test # 18min - label: PyTorch Fullgraph Test # 18min
torch_nightly: true
source_file_dependencies: source_file_dependencies:
- vllm/ - vllm/
- tests/compile - tests/compile
@@ -436,6 +439,7 @@ steps:
##### models test ##### ##### models test #####
- label: Basic Models Test # 24min - label: Basic Models Test # 24min
torch_nightly: true
source_file_dependencies: source_file_dependencies:
- vllm/ - vllm/
- tests/models - tests/models

View File

@@ -23,5 +23,11 @@ runai-model-streamer-s3==0.11.0
tensorizer>=2.9.0 tensorizer>=2.9.0
lm-eval==0.4.8 lm-eval==0.4.8
buildkite-test-collector==0.1.9 buildkite-test-collector==0.1.9
lm-eval[api]==0.4.8 # required for model evaluation test lm-eval[api]==0.4.8 # required for model evaluation test
# required for quantization test
bitsandbytes>=0.45.3
# required for minicpmo_26 test
vector_quantize_pytorch
vocos

View File

@@ -186,9 +186,9 @@ class SamplingParams(
logits_processors: list of functions that modify logits based on logits_processors: list of functions that modify logits based on
previously generated tokens, and optionally prompt tokens as previously generated tokens, and optionally prompt tokens as
a first argument. a first argument.
truncate_prompt_tokens: If set to -1, will use the truncation size truncate_prompt_tokens: If set to -1, will use the truncation size
supported by the model. If set to an integer k, will use only supported by the model. If set to an integer k, will use only
the last k tokens from the prompt (i.e., left truncation). the last k tokens from the prompt (i.e., left truncation).
Defaults to None (i.e., no truncation). Defaults to None (i.e., no truncation).
guided_decoding: If provided, the engine will construct a guided guided_decoding: If provided, the engine will construct a guided
decoding logits processor from these parameters. Defaults to None. decoding logits processor from these parameters. Defaults to None.