mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-11 07:54:57 +08:00
Speed up macOS smoke test (#28954)
Signed-off-by: Michael Goin <mgoin64@gmail.com>
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
parent 71d0ae1c54
commit a4511e38db
7
.github/workflows/macos-smoke-test.yml
vendored
7
.github/workflows/macos-smoke-test.yml
vendored
@@ -9,7 +9,7 @@ on:
|
|||||||
jobs:
|
jobs:
|
||||||
macos-m1-smoke-test:
|
macos-m1-smoke-test:
|
||||||
runs-on: macos-latest
|
runs-on: macos-latest
|
||||||
timeout-minutes: 20
|
timeout-minutes: 30
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
@@ -37,15 +37,14 @@ jobs:
|
|||||||
- name: Verify installation
|
- name: Verify installation
|
||||||
run: |
|
run: |
|
||||||
python -c "import vllm; print(f'vLLM version: {vllm.__version__}')"
|
python -c "import vllm; print(f'vLLM version: {vllm.__version__}')"
|
||||||
python -c "import torch; print(f'PyTorch: {torch.__version__}')"
|
|
||||||
|
|
||||||
- name: Smoke test vllm serve
|
- name: Smoke test vllm serve
|
||||||
timeout-minutes: 10
|
|
||||||
run: |
|
run: |
|
||||||
# Start server in background
|
# Start server in background
|
||||||
vllm serve Qwen/Qwen3-0.6B \
|
vllm serve Qwen/Qwen3-0.6B \
|
||||||
--max-model-len=2048 \
|
--max-model-len=2K \
|
||||||
--load-format=dummy \
|
--load-format=dummy \
|
||||||
|
--hf-overrides '{"num_hidden_layers": 2}' \
|
||||||
--enforce-eager \
|
--enforce-eager \
|
||||||
--port 8000 &
|
--port 8000 &
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user