# Mirror of https://git.datalinker.icu/vllm-project/vllm.git
# (synced 2025-12-09 22:44:54 +08:00; 61 lines, 1.6 KiB, YAML)
# Buildkite pipeline: the ordered list of steps for this build.
steps:
# Gate step: runs wait-for-image.sh inside a small curl/jq container on the
# A100 queue. Presumably the script polls until the CI image for this commit
# is available — confirm against the script itself.
- label: "Wait for container to be ready"
  agents:
    queue: A100
  plugins:
  - kubernetes:
      podSpec:
        containers:
        - image: badouralix/curl-jq
          command:
          - sh .buildkite/nightly-benchmarks/scripts/wait-for-image.sh

# Barrier: Buildkite does not start the steps below until every step above
# has finished successfully.
- wait

# Performance benchmark step: runs run-performance-benchmarks.sh in the CI
# image tagged with $BUILDKITE_COMMIT, on a node selected by the A100 GPU
# product label.
# NOTE(review): nesting reconstructed from the Kubernetes PodSpec schema
# (container-level vs. pod-level fields) — confirm against the upstream file.
- label: "A100"
  agents:
    queue: A100
  plugins:
  - kubernetes:
      podSpec:
        priorityClassName: perf-benchmark
        containers:
        - image: public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:$BUILDKITE_COMMIT
          command:
          - bash .buildkite/nightly-benchmarks/scripts/run-performance-benchmarks.sh
          resources:
            limits:
              # GPU limit for the benchmark container.
              nvidia.com/gpu: 8
          volumeMounts:
          # Mounts the memory-backed `devshm` volume declared under `volumes`.
          - name: devshm
            mountPath: /dev/shm
          env:
          - name: VLLM_USAGE_SOURCE
            value: ci-test
          # Read from a cluster secret rather than stored in the pipeline.
          - name: HF_TOKEN
            valueFrom:
              secretKeyRef:
                name: hf-token-secret
                key: token
        nodeSelector:
          nvidia.com/gpu.product: NVIDIA-A100-SXM4-80GB
        volumes:
        - name: devshm
          emptyDir:
            medium: Memory

# Disabled H100 step, kept commented out for reference.
# - label: "H100"
#   agents:
#     queue: H100
#   plugins:
#   - docker#v5.11.0:
#       image: public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:$BUILDKITE_COMMIT
#       command:
#       - bash
#       - .buildkite/nightly-benchmarks/run-benchmarks-suite.sh
#       mount-buildkite-agent: true
#       propagate-environment: true
#       ipc: host
#       gpus: all
#       environment:
#       - VLLM_USAGE_SOURCE
#       - HF_TOKEN