mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 07:24:56 +08:00
[CI] Shard tests for LoRA and Kernels to speed up (#3445)
This commit is contained in:
parent
abfc4f3387
commit
93348d9458
@ -33,9 +33,9 @@ steps:
|
||||
- label: Entrypoints Test
|
||||
command: pytest -v -s entrypoints
|
||||
|
||||
- label: Kernels Test
|
||||
command: pytest -v -s kernels
|
||||
soft_fail: true
|
||||
- label: Kernels Test %N
|
||||
command: pytest -v -s kernels --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
|
||||
parallelism: 4
|
||||
|
||||
- label: Models Test
|
||||
commands:
|
||||
@ -55,8 +55,9 @@ steps:
|
||||
- label: Speculative decoding tests
|
||||
command: pytest -v -s spec_decode
|
||||
|
||||
- label: LoRA Test
|
||||
command: pytest -v -s lora --forked
|
||||
- label: LoRA Test %N
|
||||
command: pytest -v -s lora --forked --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
|
||||
parallelism: 4
|
||||
|
||||
- label: Metrics Test
|
||||
command: pytest -v -s metrics
|
||||
|
||||
@ -20,6 +20,9 @@ steps:
|
||||
agents:
|
||||
queue: kubernetes
|
||||
soft_fail: {{ step.soft_fail or false }}
|
||||
{% if step.parallelism %}
|
||||
parallelism: {{ step.parallelism }}
|
||||
{% endif %}
|
||||
retry:
|
||||
automatic:
|
||||
- exit_status: -1 # Agent was lost
|
||||
|
||||
@ -16,6 +16,7 @@ pytest
|
||||
pytest-forked
|
||||
pytest-asyncio
|
||||
pytest-rerunfailures
|
||||
pytest-shard
|
||||
httpx
|
||||
einops # required for MPT
|
||||
openai
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user