@@ -8,31 +8,43 @@ export LLMDBENCH_HF_TOKEN="${LLMDBENCH_HF_TOKEN:-}"
88
# Images
# Each image is described by four variables -- REGISTRY, REPO, NAME and TAG --
# which get_image joins as REGISTRY/REPO/NAME:TAG. A value already present in
# the environment always wins; the default given here applies only when the
# variable is unset or empty. A TAG of "auto" makes get_image look the tag up
# in the registry instead of using a fixed value.

# Benchmark harness image
export LLMDBENCH_IMAGE_REGISTRY="${LLMDBENCH_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_IMAGE_REPO="${LLMDBENCH_IMAGE_REPO:-llm-d}"
export LLMDBENCH_IMAGE_NAME="${LLMDBENCH_IMAGE_NAME:-llm-d-benchmark}"
export LLMDBENCH_IMAGE_TAG="${LLMDBENCH_IMAGE_TAG:-auto}"

# llm-d image
export LLMDBENCH_LLMD_IMAGE_REGISTRY="${LLMDBENCH_LLMD_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_LLMD_IMAGE_REPO="${LLMDBENCH_LLMD_IMAGE_REPO:-llm-d}"
# The NAME default must be derived from the NAME variable itself. Reading the
# REPO variable here would make a custom repo silently change the image name
# and would make it impossible to override the name on its own.
export LLMDBENCH_LLMD_IMAGE_NAME="${LLMDBENCH_LLMD_IMAGE_NAME:-llm-d}"
export LLMDBENCH_LLMD_IMAGE_TAG="${LLMDBENCH_LLMD_IMAGE_TAG:-0.0.8}"

# llm-d model service image
export LLMDBENCH_LLMD_MODELSERVICE_IMAGE_REGISTRY="${LLMDBENCH_LLMD_MODELSERVICE_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_LLMD_MODELSERVICE_IMAGE_REPO="${LLMDBENCH_LLMD_MODELSERVICE_IMAGE_REPO:-llm-d}"
export LLMDBENCH_LLMD_MODELSERVICE_IMAGE_NAME="${LLMDBENCH_LLMD_MODELSERVICE_IMAGE_NAME:-llm-d-model-service}"
export LLMDBENCH_LLMD_MODELSERVICE_IMAGE_TAG="${LLMDBENCH_LLMD_MODELSERVICE_IMAGE_TAG:-0.0.10}"

# llm-d inference scheduler image
export LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_REGISTRY="${LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_REPO="${LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_REPO:-llm-d}"
export LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_NAME="${LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_NAME:-llm-d-inference-scheduler}"
export LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_TAG="${LLMDBENCH_LLMD_INFERENCESCHEDULER_IMAGE_TAG:-0.0.4}"

# llm-d routing sidecar image
export LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_REGISTRY="${LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_REPO="${LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_REPO:-llm-d}"
export LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_NAME="${LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_NAME:-llm-d-routing-sidecar}"
export LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_TAG="${LLMDBENCH_LLMD_ROUTINGSIDECAR_IMAGE_TAG:-0.0.6}"

# llm-d inference simulator image
export LLMDBENCH_LLMD_INFERENCESIM_IMAGE_REGISTRY="${LLMDBENCH_LLMD_INFERENCESIM_IMAGE_REGISTRY:-ghcr.io}"
export LLMDBENCH_LLMD_INFERENCESIM_IMAGE_REPO="${LLMDBENCH_LLMD_INFERENCESIM_IMAGE_REPO:-llm-d}"
export LLMDBENCH_LLMD_INFERENCESIM_IMAGE_NAME="${LLMDBENCH_LLMD_INFERENCESIM_IMAGE_NAME:-llm-d-inference-sim}"
export LLMDBENCH_LLMD_INFERENCESIM_IMAGE_TAG="${LLMDBENCH_LLMD_INFERENCESIM_IMAGE_TAG:-v0.1.2}"

# Standalone vLLM image
export LLMDBENCH_VLLM_STANDALONE_IMAGE_REGISTRY="${LLMDBENCH_VLLM_STANDALONE_IMAGE_REGISTRY:-docker.io}"
export LLMDBENCH_VLLM_STANDALONE_IMAGE_REPO="${LLMDBENCH_VLLM_STANDALONE_IMAGE_REPO:-vllm}"
export LLMDBENCH_VLLM_STANDALONE_IMAGE_NAME="${LLMDBENCH_VLLM_STANDALONE_IMAGE_NAME:-vllm-openai}"
export LLMDBENCH_VLLM_STANDALONE_IMAGE_TAG="${LLMDBENCH_VLLM_STANDALONE_IMAGE_TAG:-latest}"
3138
3239# External repositories
3340export LLMDBENCH_DEPLOYER_GIT_REPO=" ${LLMDBENCH_DEPLOYER_GIT_REPO:- https:// github.com/ llm-d/ llm-d-deployer.git} "
3441export LLMDBENCH_DEPLOYER_DIR=" ${LLMDBENCH_DEPLOYER_DIR:-/ tmp} "
3542export LLMDBENCH_DEPLOYER_GIT_BRANCH=" ${LLMDBENCH_DEPLOYER_GIT_BRANCH:- main} "
43+
44+ export LLMDBENCH_INFRA_GIT_REPO=" ${LLMDBENCH_INFRA_GIT_REPO:- https:// github.com/ llm-d-incubation/ llm-d-infra.git} "
45+ export LLMDBENCH_INFRA_DIR=" ${LLMDBENCH_INFRA_DIR:-/ tmp} "
46+ export LLMDBENCH_INFRA_GIT_BRANCH=" ${LLMDBENCH_INFRA_GIT_BRANCH:- main} "
47+
3648export LLMDBENCH_HARNESS_GIT_REPO=" ${LLMDBENCH_HARNESS_GIT_REPO:- auto} "
3749export LLMDBENCH_HARNESS_DIR=" ${LLMDBENCH_HARNESS_DIR:-/ tmp} "
3850export LLMDBENCH_HARNESS_GIT_BRANCH=" ${LLMDBENCH_HARNESS_GIT_BRANCH:- main} "
@@ -42,6 +54,8 @@ export LLMDBENCH_VLLM_COMMON_NAMESPACE="${LLMDBENCH_VLLM_COMMON_NAMESPACE:-llmdb
4254export LLMDBENCH_VLLM_COMMON_SERVICE_ACCOUNT=" ${LLMDBENCH_VLLM_COMMON_SERVICE_ACCOUNT:- default} "
4355
4456export LLMDBENCH_VLLM_COMMON_ACCELERATOR_RESOURCE=${LLMDBENCH_VLLM_COMMON_ACCELERATOR_RESOURCE:- nvidia.com/ gpu}
57+ export LLMDBENCH_VLLM_COMMON_NETWORK_RESOURCE=${LLMDBENCH_VLLM_COMMON_NETWORK_RESOURCE:- }
58+ export LLMDBENCH_VLLM_COMMON_NETWORK_NR=${LLMDBENCH_VLLM_COMMON_NETWORK_NR:- }
4559export LLMDBENCH_VLLM_COMMON_AFFINITY=${LLMDBENCH_VLLM_COMMON_AFFINITY:- ${LLMDBENCH_VLLM_COMMON_ACCELERATOR_RESOURCE} .product: NVIDIA-H100-80GB-HBM3}
4660export LLMDBENCH_VLLM_COMMON_REPLICAS=${LLMDBENCH_VLLM_COMMON_REPLICAS:- 1}
4761export LLMDBENCH_VLLM_COMMON_PERSISTENCE_ENABLED=${LLMDBENCH_VLLM_COMMON_PERSISTENCE_ENABLED:- true}
@@ -79,16 +93,34 @@ export LLMDBENCH_VLLM_STANDALONE_EPHEMERAL_STORAGE=${LLMDBENCH_VLLM_STANDALONE_E
7993export LLMDBENCH_VLLM_DEPLOYER_VALUES_FILE=${LLMDBENCH_VLLM_DEPLOYER_VALUES_FILE:- " fromenv" }
8094export LLMDBENCH_VLLM_DEPLOYER_PREFILL_REPLICAS=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_REPLICAS:- 1}
8195export LLMDBENCH_VLLM_DEPLOYER_PREFILL_EXTRA_ARGS=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_EXTRA_ARGS:- " [--disable-log-requests]" }
96+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_ACCELERATOR_NR=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_ACCELERATOR_NR:- $LLMDBENCH_VLLM_COMMON_ACCELERATOR_NR }
97+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_ACCELERATOR_MEM_UTIL=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_ACCELERATOR_MEM_UTIL:- $LLMDBENCH_VLLM_COMMON_ACCELERATOR_MEM_UTIL }
98+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_NETWORK_RESOURCE=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_NETWORK_RESOURCE:- $LLMDBENCH_VLLM_COMMON_NETWORK_RESOURCE }
99+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_NETWORK_NR=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_NETWORK_NR:- $LLMDBENCH_VLLM_COMMON_NETWORK_NR }
100+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_CPU_NR=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_CPU_NR:- $LLMDBENCH_VLLM_COMMON_CPU_NR }
101+ export LLMDBENCH_VLLM_DEPLOYER_PREFILL_CPU_MEM=${LLMDBENCH_VLLM_DEPLOYER_PREFILL_CPU_MEM:- $LLMDBENCH_VLLM_COMMON_CPU_MEM }
82102export LLMDBENCH_VLLM_DEPLOYER_DECODE_REPLICAS=${LLMDBENCH_VLLM_DEPLOYER_DECODE_REPLICAS:- 1}
83103export LLMDBENCH_VLLM_DEPLOYER_DECODE_EXTRA_ARGS=${LLMDBENCH_VLLM_DEPLOYER_DECODE_EXTRA_ARGS:- " [--disable-log-requests]" }
84- export LLMDBENCH_VLLM_DEPLOYER_BASECONFIGMAPREFNAME=${LLMDBENCH_VLLM_DEPLOYER_BASECONFIGMAPREFNAME:- " basic-gpu-with-nixl-and-redis-lookup-preset" }
85- export LLMDBENCH_VLLM_DEPLOYER_MODELSERVICE_REPLICAS=${LLMDBENCH_VLLM_DEPLOYER_MODELSERVICE_REPLICAS:- 1}
86- export LLMDBENCH_VLLM_DEPLOYER_ROUTE=${LLMDBENCH_VLLM_DEPLOYER_ROUTE:- 1}
104+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_ACCELERATOR_NR=${LLMDBENCH_VLLM_DEPLOYER_DECODE_ACCELERATOR_NR:- $LLMDBENCH_VLLM_COMMON_ACCELERATOR_NR }
105+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_ACCELERATOR_MEM_UTIL=${LLMDBENCH_VLLM_DEPLOYER_DECODE_ACCELERATOR_MEM_UTIL:- $LLMDBENCH_VLLM_COMMON_ACCELERATOR_MEM_UTIL }
106+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_NETWORK_RESOURCE=${LLMDBENCH_VLLM_DEPLOYER_DECODE_NETWORK_RESOURCE:- $LLMDBENCH_VLLM_COMMON_NETWORK_RESOURCE }
107+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_NETWORK_NR=${LLMDBENCH_VLLM_DEPLOYER_DECODE_NETWORK_NR:- $LLMDBENCH_VLLM_COMMON_NETWORK_NR }
108+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_CPU_NR=${LLMDBENCH_VLLM_DEPLOYER_DECODE_CPU_NR:- $LLMDBENCH_VLLM_COMMON_CPU_NR }
109+ export LLMDBENCH_VLLM_DEPLOYER_DECODE_CPU_MEM=${LLMDBENCH_VLLM_DEPLOYER_DECODE_CPU_MEM:- $LLMDBENCH_VLLM_COMMON_CPU_MEM }
87110export LLMDBENCH_VLLM_DEPLOYER_GATEWAY_CLASS_NAME=${LLMDBENCH_VLLM_DEPLOYER_GATEWAY_CLASS_NAME:- kgateway}
88111export LLMDBENCH_VLLM_DEPLOYER_RELEASE=${LLMDBENCH_VLLM_DEPLOYER_RELEASE:- " llm-d" }
112+ export LLMDBENCH_VLLM_DEPLOYER_ROUTE=${LLMDBENCH_VLLM_DEPLOYER_ROUTE:- 1}
113+
114+ # FIXME (start) delete after removal of llm-d-deployer
115+ export LLMDBENCH_VLLM_DEPLOYER_BASECONFIGMAPREFNAME=${LLMDBENCH_VLLM_DEPLOYER_BASECONFIGMAPREFNAME:- " basic-gpu-with-nixl-and-redis-lookup-preset" }
116+ export LLMDBENCH_VLLM_DEPLOYER_MODELSERVICE_REPLICAS=${LLMDBENCH_VLLM_DEPLOYER_MODELSERVICE_REPLICAS:- 1}
89117export LLMDBENCH_VLLM_DEPLOYER_RECONFIGURE_GATEWAY_AFTER_DEPLOY=${LLMDBENCH_VLLM_DEPLOYER_RECONFIGURE_GATEWAY_AFTER_DEPLOY:- 0}
118+ # FIXME (end) delete after removal of llm-d-deployer
90119
91120# Endpoint Picker Parameters, Deployer-specific
121+ export LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS=${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS:- " default" }
122+
123+ # FIXME (start) delete after removal of llm-d-deployer
92124export LLMDBENCH_VLLM_DEPLOYER_EPP_ENABLE_KVCACHE_AWARE_SCORER=${LLMDBENCH_VLLM_DEPLOYER_EPP_ENABLE_KVCACHE_AWARE_SCORER:- false}
93125export LLMDBENCH_VLLM_DEPLOYER_EPP_KVCACHE_AWARE_SCORER_WEIGHT=${LLMDBENCH_VLLM_DEPLOYER_EPP_KVCACHE_AWARE_SCORER_WEIGHT:- 1}
94126export LLMDBENCH_VLLM_DEPLOYER_EPP_ENABLE_PREFIX_AWARE_SCORER=${LLMDBENCH_VLLM_DEPLOYER_EPP_ENABLE_PREFIX_AWARE_SCORER:- true}
@@ -115,6 +147,7 @@ export LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_ENABLE_PREFIX_AWARE_SCORER=${LLMDBENCH
115147export LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_PREFIX_AWARE_SCORER_WEIGHT=${LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_PREFIX_AWARE_SCORER_WEIGHT:- 1}
116148export LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_ENABLE_SESSION_AWARE_SCORER=${LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_ENABLE_SESSION_AWARE_SCORER:- false}
117149export LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_SESSION_AWARE_SCORER_WEIGHT=${LLMDBENCH_VLLM_DEPLOYER_EPP_DECODE_SESSION_AWARE_SCORER_WEIGHT:- 1}
150+ # FIXME (end) delete after removal of llm-d-deployer
118151
119152# Modelservice (helm chart) specific parameters
120153export LLMDBENCH_VLLM_MODELSERVICE_VALUES_FILE=${LLMDBENCH_VLLM_MODELSERVICE_VALUES_FILE:- " default-values.yaml" }
@@ -182,12 +215,15 @@ function model_attribute {
182215 esac
183216
184217 local modelcomponents=$( echo $model | cut -d ' /' -f 2 | tr ' [:upper:]' ' [:lower:]' | $LLMDBENCH_CONTROL_SCMD -e ' s^qwen^qwen-^g' -e ' s^-^\n^g' )
218+ local provider=$( echo $model | cut -d ' /' -f 1)
185219 local type=$( echo " ${modelcomponents} " | grep -Ei " nstruct|hf|chat|speech|vision" )
186- local parameters=$( echo " ${modelcomponents} " | grep -Ei " [0-9].*b" | $LLMDBENCH_CONTROL_SCMD -e ' s^a^^' -e ' s^\.^p^' )
187- local majorversion=$( echo " ${modelcomponents} " | grep -Ei " ^[0-9]" | grep -Evi " b|E" | cut -d ' .' -f 1)
220+ local parameters=$( echo " ${modelcomponents} " | grep -Ei " [0-9].*b|[0-9].*m " | $LLMDBENCH_CONTROL_SCMD -e ' s^a^^' -e ' s^\.^p^' )
221+ local majorversion=$( echo " ${modelcomponents} " | grep -Ei " ^[0-9]" | grep -Evi " b|E" | $LLMDBENCH_CONTROL_SCMD -e " s/ $parameters //g " | cut -d ' .' -f 1)
188222 local kind=$( echo " ${modelcomponents} " | head -n 1 | cut -d ' /' -f 1)
189- local label=${kind} -${majorversion} -${parameters}
190223 local as_label=$( echo $model | tr ' [:upper:]' ' [:lower:]' | $LLMDBENCH_CONTROL_SCMD -e " s^/^-^g" )
224+ local label=$( echo ${kind} -${majorversion} -${parameters} | $LLMDBENCH_CONTROL_SCMD -e ' s^-$^^g' -e ' s^--^^g' )
225+ local as_label=$( echo $model | tr ' [:upper:]' ' [:lower:]' | $LLMDBENCH_CONTROL_SCMD -e " s^/^-^g" -e " s^\.^-^g" )
226+ local folder=$( echo $model | tr ' [:upper:]' ' [:lower:]' | $LLMDBENCH_CONTROL_SCMD -e ' s^/^_^g' -e ' s^-^_^g' )
191227
192228 if [[ $attribute != " model" ]];
193229 then
@@ -255,45 +291,29 @@ else
255291 fi
256292fi
257293
258- if [[ $LLMDBENCH_CONTROL_DEPENDENCIES_CHECKED -eq 0 && ! -f ~ /.llmdbench_dependencies_checked ]]
259- then
260- deplist=" $LLMDBENCH_CONTROL_SCMD $LLMDBENCH_CONTROL_PCMD $LLMDBENCH_CONTROL_KCMD $LLMDBENCH_CONTROL_HCMD kubectl kustomize rsync"
261- echo " Checking dependencies \" $deplist \" "
262- for req in $deplist kubectl kustomize; do
263- echo -n " Checking dependency \" ${req} \" ..."
264- is_req=$( which ${req} || true)
265- if [[ -z ${is_req} ]]; then
266- echo " ❌ Dependency \" ${req} \" is missing"
267- exit 1
268- fi
269- echo " done"
270- done
271- touch ~ /.llmdbench_dependencies_checked
272- export LLMDBENCH_CONTROL_DEPENDENCIES_CHECKED=1
273- fi
274-
#######################################
# Print a container image reference, or only its tag.
# Globals:
#   LLMDBENCH_CONTROL_CCMD (read) - when it is "podman", tags are listed with
#     "<ccmd> search --list-tags"; otherwise "skopeo list-tags" piped through
#     jq is used. Only consulted when the tag is "auto".
# Arguments:
#   $1 - image registry
#   $2 - image repository
#   $3 - image name
#   $4 - image tag; the literal "auto" selects the last tag listed for the image
#   $5 - optional, default 0; when 1 only the tag is printed
# Outputs:
#   stdout: "<registry>/<repo>/<name>:<tag>", or "<tag>" when $5 is 1
#   stderr: an error message when an "auto" tag cannot be resolved
# Returns:
#   Calls "exit 1" when an "auto" tag cannot be resolved. Inside a command
#   substitution this ends only the substitution, so callers still have to
#   check its status.
#######################################
function get_image {
  local image_registry=$1
  local image_repo=$2
  local image_name=$3
  local image_tag=$4
  local tag_only=${5:-0}
  local image_path="${image_registry}/${image_repo}/${image_name}"
  # Kept local so that a direct (non-substitution) call does not leave a stray
  # global behind in the caller's shell.
  local is_latest_tag=$image_tag

  if [[ "${image_tag}" == "auto" ]]; then
    if [[ "${LLMDBENCH_CONTROL_CCMD}" == "podman" ]]; then
      is_latest_tag=$("${LLMDBENCH_CONTROL_CCMD}" search --list-tags "${image_path}" | tail -1 | awk '{ print $2 }' || true)
    else
      # "|| true" mirrors the podman branch: a failed lookup must fall through
      # to the explicit error below rather than abort silently when the caller
      # runs with errexit/pipefail.
      is_latest_tag=$(skopeo list-tags "docker://${image_path}" | jq -r '.Tags[]' | tail -1 || true)
    fi
    if [[ -z "${is_latest_tag}" ]]; then
      # stdout is normally captured by the caller as the image reference, so
      # the diagnostic has to go to stderr to be seen and to keep stdout clean.
      echo "❌ Unable to find latest tag for image \"${image_path}\"" >&2
      exit 1
    fi
  fi

  if [[ "${tag_only}" -eq 1 ]]; then
    printf '%s\n' "${is_latest_tag}"
  else
    printf '%s\n' "${image_path}:${is_latest_tag}"
  fi
}
299319
@@ -321,6 +341,18 @@ if [[ ! -z $LLMDBENCH_DEPLOY_SCENARIO ]]; then
321341 fi
322342fi
323343
# Resolve the GAIE presets selection to a concrete YAML file.
# LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS may be given with or without the
# ".yaml" suffix, and either as an absolute path or as a name looked up under
# ${LLMDBENCH_MAIN_DIR}/setup/presets/gaie. One trailing ".yaml" is stripped
# and then re-appended, so both spellings resolve to the same file. This is
# done with parameter expansion instead of an unanchored regular expression,
# which could also rewrite unrelated parts of the path (for example a preset
# called "myyaml").
if [[ "${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS}" == /* ]]; then
  export LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH="${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS%.yaml}.yaml"
else
  export LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH="${LLMDBENCH_MAIN_DIR}/setup/presets/gaie/${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS%.yaml}.yaml"
fi

if [[ ! -f "${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH}" ]]; then
  echo "❌ GAIE presets file \"$LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH\" could not be found."
  exit 1
fi

# From here on the variable holds only the file name (last path component,
# including the ".yaml" suffix); the full location stays available in
# LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH.
export LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS="${LLMDBENCH_VLLM_DEPLOYER_GAIE_PRESETS_FULL_PATH##*/}"
355+
324356overridevarlist=$( env | grep _CLIOVERRIDE_ | cut -d ' =' -f 1 || true)
325357if [[ -n " $overridevarlist " ]]; then
326358 for overridevar in $overridevarlist ; do
@@ -356,6 +388,7 @@ export LLMDBENCH_CONTROL_WORK_DIR_SET=${LLMDBENCH_CONTROL_WORK_DIR_SET:-0}
356388
357389function prepare_work_dir {
358390 mkdir -p ${LLMDBENCH_CONTROL_WORK_DIR} /setup/yamls
391+ mkdir -p ${LLMDBENCH_CONTROL_WORK_DIR} /setup/helm
359392 mkdir -p ${LLMDBENCH_CONTROL_WORK_DIR} /setup/commands
360393 mkdir -p ${LLMDBENCH_CONTROL_WORK_DIR} /environment
361394 mkdir -p ${LLMDBENCH_CONTROL_WORK_DIR} /workload/harnesses
@@ -746,9 +779,9 @@ create_or_update_hf_secret() {
746779}
747780export -f create_or_update_hf_secret
748781
749- #
782+ #
750783# vLLM Model Download Utilities
751- #
784+ #
752785
753786validate_and_create_pvc () {
754787 local kcmd=" $1 "
@@ -882,7 +915,7 @@ wait_for_download_job() {
882915 announce " 🙀 Pod did not become Ready"
883916 llmdbench_execute_cmd " ${kcmd} logs job/download-model -n ${namespace} " ${LLMDBENCH_CONTROL_DRY_RUN} ${LLMDBENCH_CONTROL_VERBOSE} 0 1 0
884917 exit 1
885- fi
918+ fi
886919
887920 announce " ⏳ Waiting up to ${timeout} s for job to complete..."
888921 llmdbench_execute_cmd " ${kcmd} wait --for=condition=complete --timeout=" ${timeout} " s job/download-model -n ${namespace} " ${LLMDBENCH_CONTROL_DRY_RUN} ${LLMDBENCH_CONTROL_VERBOSE}
0 commit comments