# Buildkite pipeline for the nightly performance benchmarks.
#
# Flow:
#   1. A lightweight pod runs wait-for-image.sh (per the step label, this
#      waits for the CI container image to be ready; script not shown here).
#   2. `wait` holds the pipeline until every step above has finished.
#   3. The benchmark suite runs on the A100 queue inside the image tagged
#      with the commit under test ($BUILDKITE_COMMIT).
steps:
  # Gate step: runs the wait-for-image script in a small curl + jq image.
  - label: "Wait for container to be ready"
    agents:
      queue: A100
    plugins:
      - kubernetes:
          podSpec:
            containers:
              - image: badouralix/curl-jq
                command:
                  - sh .buildkite/nightly-benchmarks/scripts/wait-for-image.sh

  # Barrier: do not start the benchmarks until the gate step has completed.
  - wait

  # Benchmark step: runs the performance benchmark script on an A100 node.
  - label: "A100"
    agents:
      queue: A100
    plugins:
      - kubernetes:
          podSpec:
            priorityClassName: perf-benchmark
            containers:
              - image: public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:$BUILDKITE_COMMIT
                command:
                  - bash .buildkite/nightly-benchmarks/scripts/run-performance-benchmarks.sh
                resources:
                  limits:
                    # Request 8 GPUs for the benchmark container.
                    nvidia.com/gpu: 8
                volumeMounts:
                  # Memory-backed volume (defined under `volumes` below)
                  # mounted over /dev/shm.
                  - name: devshm
                    mountPath: /dev/shm
                env:
                  - name: VLLM_USAGE_SOURCE
                    value: ci-test
                  # Token is read from a cluster secret, never inlined here.
                  - name: HF_TOKEN
                    valueFrom:
                      secretKeyRef:
                        name: hf-token-secret
                        key: token
            # Pin the pod to nodes exposing 80GB A100 SXM4 GPUs.
            nodeSelector:
              nvidia.com/gpu.product: NVIDIA-A100-SXM4-80GB
            volumes:
              - name: devshm
                emptyDir:
                  medium: Memory

  # Disabled: H100 benchmark step (Docker plugin variant). Kept for reference.
  # - label: "H100"
  #   agents:
  #     queue: H100
  #   plugins:
  #     - docker#v5.11.0:
  #         image: public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:$BUILDKITE_COMMIT
  #         command:
  #           - bash
  #           - .buildkite/nightly-benchmarks/run-benchmarks-suite.sh
  #         mount-buildkite-agent: true
  #         propagate-environment: true
  #         ipc: host
  #         gpus: all
  #         environment:
  #           - VLLM_USAGE_SOURCE
  #           - HF_TOKEN