We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d14a79f, commit dabbc63 (Copy full SHA for dabbc63)
test/vllm/ec2/utils/run_vllm_on_arm64.sh
@@ -59,6 +59,7 @@ docker run --rm \
59
--entrypoint /bin/bash \
60
-e "HUGGING_FACE_HUB_TOKEN=$HF_TOKEN" \
61
-e VLLM_WORKER_MULTIPROC_METHOD=spawn \
62
+ -e VLLM_FLASH_ATTN_VERSION=2 \
63
-v "$HOME/.cache/huggingface:/root/.cache/huggingface" \
64
--gpus=all \
65
"$DLC_IMAGE" \
0 commit comments