Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion deploy/install.sh
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ CONTROLLER_INSTANCE=${CONTROLLER_INSTANCE:-""}
# llm-d Configuration
# Each setting below uses ${VAR:-default}: a non-empty value already present in
# the environment is kept; otherwise the quoted default is assigned.
LLM_D_OWNER=${LLM_D_OWNER:-"llm-d"}
LLM_D_PROJECT=${LLM_D_PROJECT:-"llm-d"}
# NOTE(review): the next two lines look like the deleted and added sides of a
# one-line diff (old default "v0.3.0", new default "main") — confirm. Read as
# literal shell, the first assignment always leaves LLM_D_RELEASE non-empty, so
# the "main" default on the second line could never take effect.
LLM_D_RELEASE=${LLM_D_RELEASE:-"v0.3.0"}
LLM_D_RELEASE=${LLM_D_RELEASE:-"main"}
# NOTE(review): "main" presumably names a moving branch rather than a pinned
# release tag — confirm that a non-reproducible default is acceptable here.
# The two default resource names below embed $WELL_LIT_PATH_NAME, which is not
# assigned in this excerpt — presumably set earlier in the script; verify.
LLM_D_MODELSERVICE_NAME=${LLM_D_MODELSERVICE_NAME:-"ms-$WELL_LIT_PATH_NAME-llm-d-modelservice"}
LLM_D_EPP_NAME=${LLM_D_EPP_NAME:-"gaie-$WELL_LIT_PATH_NAME-epp"}
# Default path is composed from $WVA_PROJECT (not assigned in this excerpt —
# TODO confirm where it is set) and $LLM_D_PROJECT.
CLIENT_PREREQ_DIR=${CLIENT_PREREQ_DIR:-"$WVA_PROJECT/$LLM_D_PROJECT/guides/prereq/client-setup"}
Expand Down
29 changes: 29 additions & 0 deletions deploy/lib/infra_llmd.sh
Original file line number Diff line number Diff line change
Expand Up @@ -328,6 +328,35 @@ deploy_llm_d_infrastructure() {
else
log_warning "ConfigMap $LLM_D_EPP_NAME not found in $LLMD_NS"
fi

# Ensure EPP has RBAC for InferenceModelRewrite (required by EPP v0.7.0+
# which watches this CRD, but older inferencepool Helm charts don't include it).
log_info "Ensuring EPP RBAC includes inferencemodelrewrites permission"
kubectl apply -f - <<RBAC_EOF
apiVersion: rbac.authorization.k8s.io/v1
kind: Role
metadata:
name: ${LLM_D_EPP_NAME}-model-rewrite
namespace: ${LLMD_NS}
rules:
- apiGroups: ["inference.networking.x-k8s.io"]
resources: ["inferencemodelrewrites"]
verbs: ["get", "list", "watch"]
---
apiVersion: rbac.authorization.k8s.io/v1
kind: RoleBinding
metadata:
name: ${LLM_D_EPP_NAME}-model-rewrite
namespace: ${LLMD_NS}
subjects:
- kind: ServiceAccount
name: ${LLM_D_EPP_NAME}
namespace: ${LLMD_NS}
roleRef:
apiGroup: rbac.authorization.k8s.io
kind: Role
name: ${LLM_D_EPP_NAME}-model-rewrite
RBAC_EOF
else
log_warning "Skipping inference-scheduler patch: Deployment $LLM_D_EPP_NAME not found in $LLMD_NS"
fi
Expand Down
Loading