From 08ff2e4d33cdad0605bdd093310b2d4bd63ddf9b Mon Sep 17 00:00:00 2001 From: hiento09 Date: Tue, 12 Aug 2025 10:17:55 +0700 Subject: [PATCH] chore: update jan inference model Dockerfile cmd --- apps/jan-inference-model/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/apps/jan-inference-model/Dockerfile b/apps/jan-inference-model/Dockerfile index 657204c3..274256b2 100644 --- a/apps/jan-inference-model/Dockerfile +++ b/apps/jan-inference-model/Dockerfile @@ -6,4 +6,4 @@ RUN pip install --no-cache-dir huggingface_hub \ EXPOSE 8101 -CMD ["--model", "Qwen/Qwen3-4B", "--host", "0.0.0.0", "--port", "8101"] \ No newline at end of file +CMD ["--model", "Qwen/Qwen3-4B", "--host", "0.0.0.0", "--port", "8101", "--gpu-memory-utilization", "0.65", "--enforce-eager", "--max_model_len", "32768"] \ No newline at end of file