We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 028dc61 + d82751d; commit a645748 (Copy full SHA for a645748)
docker/vllm.Dockerfile
@@ -1,4 +1,4 @@
1
-FROM vllm/vllm-openai:v0.10.1
+FROM vllm/vllm-openai:v0.11.2
2
3
# # Specify model name and path during build
4
# ARG MODEL_NAME=llama_1b_cpu
@@ -9,6 +9,7 @@ FROM vllm/vllm-openai:v0.10.1
9
# ENV MODEL_PATH=${MODEL_PATH}
10
# ENV EXEC_PATH=nilai_models.models.${MODEL_NAME}:app
11
12
+ENV PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
13
COPY --link . /daemon/
14
COPY --link vllm_templates /opt/vllm/templates
15
0 commit comments