Skip to content

Commit 1298a40

Browse files
authored
[ci/build] fix gh200 test (vllm-project#12681)
Signed-off-by: youkaichao <[email protected]>
1 parent ad4a9dc commit 1298a40

File tree

3 files changed

+5
-5
lines changed

3 files changed

+5
-5
lines changed

.buildkite/check-wheel-size.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,11 +4,11 @@
4 4
import sys
5 5
import zipfile
6 6

7-
# Read the VLLM_MAX_SIZE_MB environment variable, defaulting to 300 MiB
7+
# Read the VLLM_MAX_SIZE_MB environment variable, defaulting to 400 MiB
8 8
# Note that we have 400 MiB quota, please use it wisely.
9 9
# See https://github.com/pypi/support/issues/3792 .
10 10
# Please also sync the value with the one in Dockerfile.
11-
VLLM_MAX_SIZE_MB = int(os.environ.get('VLLM_MAX_SIZE_MB', 300))
11+
VLLM_MAX_SIZE_MB = int(os.environ.get('VLLM_MAX_SIZE_MB', 400))
12 12

13 13

14 14
def print_top_10_largest_files(zip_file):

.buildkite/run-gh200-test.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,6 @@ trap remove_docker_container EXIT
23 23
remove_docker_container
24 24

25 25
# Run the image and test offline inference
26-
docker run --name gh200-test --gpus=all --entrypoint="" gh200-test bash -c '
27-
python3 examples/offline_inference/basic.py
26+
docker run -e HF_TOKEN -v /root/.cache/huggingface:/root/.cache/huggingface --name gh200-test --gpus=all --entrypoint="" gh200-test bash -c '
27+
python3 examples/offline_inference/cli.py --model meta-llama/Llama-3.2-1B
28 28
'

Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -127,7 +127,7 @@ RUN --mount=type=cache,target=/root/.cache/ccache \
127 127
# Check the size of the wheel if RUN_WHEEL_CHECK is true
128 128
COPY .buildkite/check-wheel-size.py check-wheel-size.py
129 129
# sync the default value with .buildkite/check-wheel-size.py
130-
ARG VLLM_MAX_SIZE_MB=300
130+
ARG VLLM_MAX_SIZE_MB=400
131 131
ENV VLLM_MAX_SIZE_MB=$VLLM_MAX_SIZE_MB
132 132
ARG RUN_WHEEL_CHECK=true
133 133
RUN if [ "$RUN_WHEEL_CHECK" = "true" ]; then \

0 commit comments

Comments
 (0)