Skip to content

Commit 24d87fb

Browse files
committed
Remove old charts and update CI workflows for unified fma-controllers chart
Update (1:42 PM EST): resolved conflicts in the OpenShift CI workflow. Delete the charts/dual-pods-controller/ and charts/launcher-populator/ directories. Update the CI workflows to use the new chart path, deployment names, and label selectors. Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com> Signed-off-by: Gloire Rubambiza <gloire@ibm.com>
1 parent 69a28bc commit 24d87fb

20 files changed

+37
-397
lines changed

.github/workflows/ci-e2e-openshift.yaml

Lines changed: 20 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -476,35 +476,37 @@ jobs:
476476
echo " Image: $CONTROLLER_IMAGE"
477477
echo " EnableValidationPolicy: $POLICIES_ENABLED"
478478
479-
helm upgrade --install "$FMA_RELEASE_NAME" charts/dual-pods-controller \
479+
helm upgrade --install "$FMA_RELEASE_NAME" charts/fma-controllers \
480480
-n "$FMA_NAMESPACE" \
481-
--set Image="$CONTROLLER_IMAGE" \
482-
--set NodeViewClusterRole=fma-node-viewer \
483-
--set SleeperLimit=2 \
484-
--set Local=false \
485-
--set DebugAcceleratorMemory=false \
486-
--set EnableValidationPolicy="$POLICIES_ENABLED"
481+
--set dualPodsController.image.repository="${CONTROLLER_IMAGE%:*}" \
482+
--set dualPodsController.image.tag="${CONTROLLER_IMAGE##*:}" \
483+
--set global.nodeViewClusterRole=fma-node-viewer \
484+
--set dualPodsController.sleeperLimit=2 \
485+
--set global.local=false \
486+
--set dualPodsController.debugAcceleratorMemory=false \
487+
--set global.enableValidationPolicy="$POLICIES_ENABLED" \
488+
--set launcherPopulator.enabled=false
487489
488490
- name: Wait for controller to be ready
489491
run: |
490492
echo "Waiting for FMA controller deployment to be ready..."
491493
kubectl wait --for=condition=available --timeout=120s \
492-
deployment "$FMA_RELEASE_NAME" -n "$FMA_NAMESPACE"
494+
deployment "$FMA_RELEASE_NAME-dual-pods-controller" -n "$FMA_NAMESPACE"
493495
494496
echo ""
495497
echo "=== Controller Pod Status ==="
496-
kubectl get pods -n "$FMA_NAMESPACE" -l app.kubernetes.io/name=dual-pods
498+
kubectl get pods -n "$FMA_NAMESPACE" -l app.kubernetes.io/name=fma-controllers
497499
echo ""
498500
echo "=== Controller Deployment ==="
499-
kubectl get deployment "$FMA_RELEASE_NAME" -n "$FMA_NAMESPACE"
501+
kubectl get deployment "$FMA_RELEASE_NAME-dual-pods-controller" -n "$FMA_NAMESPACE"
500502
501503
- name: Verify controller health
502504
run: |
503505
echo "Checking controller pod for issues..."
504506
505507
# Get the controller pod name
506508
POD_NAME=$(kubectl get pods -n "$FMA_NAMESPACE" \
507-
-l app.kubernetes.io/name=dual-pods,app.kubernetes.io/component=controller \
509+
-l app.kubernetes.io/name=fma-controllers,app.kubernetes.io/component=dual-pods-controller \
508510
-o jsonpath='{.items[0].metadata.name}')
509511
510512
if [ -z "$POD_NAME" ]; then
@@ -910,7 +912,7 @@ jobs:
910912
if: failure()
911913
run: |
912914
echo "Test failed - scaling down controller to free resources while preserving for debugging..."
913-
kubectl scale deployment "$FMA_RELEASE_NAME" -n "$FMA_NAMESPACE" --replicas=0 || true
915+
kubectl scale deployment "$FMA_RELEASE_NAME-dual-pods-controller" -n "$FMA_NAMESPACE" --replicas=0 || true
914916
915917
echo ""
916918
echo "=== Remaining resources for debugging ==="
@@ -923,13 +925,13 @@ jobs:
923925
echo "=== Events ==="
924926
kubectl get events -n "$FMA_NAMESPACE" --sort-by='.lastTimestamp' 2>/dev/null | tail -30 || true
925927
echo ""
926-
echo "=== Full controller logs ==="
927-
kubectl logs deployment/"$FMA_RELEASE_NAME" -n "$FMA_NAMESPACE" --previous 2>/dev/null || true
928-
kubectl logs deployment/"$FMA_RELEASE_NAME" -n "$FMA_NAMESPACE" 2>/dev/null || true
928+
echo "=== Dual Pods controller logs ==="
929+
kubectl logs deployment/"$FMA_RELEASE_NAME-dual-pods-controller" -n "$FMA_NAMESPACE" --previous 2>/dev/null || true
930+
kubectl logs deployment/"$FMA_RELEASE_NAME-dual-pods-controller" -n "$FMA_NAMESPACE" 2>/dev/null || true
929931
echo ""
930-
echo "=== Launcher-populator logs ==="
931-
kubectl logs deployment/launcher-populator -n "$FMA_NAMESPACE" --previous 2>/dev/null || true
932-
kubectl logs deployment/launcher-populator -n "$FMA_NAMESPACE" 2>/dev/null || true
932+
echo "=== Launcher-populator controller logs ==="
933+
kubectl logs deployment/"$FMA_RELEASE_NAME-launcher-populator" -n "$FMA_NAMESPACE" --previous 2>/dev/null || true
934+
kubectl logs deployment/"$FMA_RELEASE_NAME-launcher-populator" -n "$FMA_NAMESPACE" 2>/dev/null || true
933935
934936
# Report status back to PR for issue_comment triggered runs
935937
# This ensures fork PRs show the correct status after /ok-to-test runs complete

.github/workflows/launcher-based-e2e-test.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -70,11 +70,11 @@ jobs:
7070

7171
- name: show dual-pods controller log
7272
if: always()
73-
run: kubectl logs deploy/dpctlr
73+
run: kubectl logs deploy/dpctlr-dual-pods-controller
7474

7575
- name: show launcher-populator log
7676
if: always()
77-
run: kubectl logs deploy/launcher-populator || echo "launcher-populator not deployed"
77+
run: kubectl logs deploy/dpctlr-launcher-populator || echo "launcher-populator not deployed"
7878

7979
- name: show GPU allocations
8080
if: always()

.github/workflows/pr-test-in-kind.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@ jobs:
6161

6262
- name: show dual-pods controller log
6363
if: always()
64-
run: kubectl logs deploy/dpctlr
64+
run: kubectl logs deploy/dpctlr-dual-pods-controller
6565

6666
- name: show GPU allocations
6767
if: always()

.github/workflows/publish-release.yaml

Lines changed: 14 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -130,20 +130,21 @@ jobs:
130130
TAG="${{ steps.version.outputs.tag }}"
131131
reg="${{ github.repository }}"
132132
133-
# Update dual-pods-controller chart values
134-
DPCTLR_CHART="charts/dual-pods-controller"
135-
yq eval -i ".Image = \"ghcr.io/${reg@L}/dual-pods-controller:${TAG}\"" $DPCTLR_CHART/values.yaml
133+
CHART="charts/fma-controllers"
136134
137-
echo "Updated $DPCTLR_CHART/values.yaml:"
138-
yq eval '.Image' $DPCTLR_CHART/values.yaml
135+
# Update dual-pods-controller image
136+
yq eval -i ".dualPodsController.image.repository = \"ghcr.io/${reg@L}/dual-pods-controller\"" $CHART/values.yaml
137+
yq eval -i ".dualPodsController.image.tag = \"${TAG}\"" $CHART/values.yaml
139138
140-
# Update launcher-populator chart values
141-
POPULATOR_CHART="charts/launcher-populator"
142-
yq eval -i ".image.repository = \"ghcr.io/${reg@L}/launcher-populator\"" $POPULATOR_CHART/values.yaml
143-
yq eval -i ".image.tag = \"${TAG}\"" $POPULATOR_CHART/values.yaml
139+
echo "Updated dual-pods-controller image:"
140+
yq eval '.dualPodsController.image' $CHART/values.yaml
144141
145-
echo "Updated $POPULATOR_CHART/values.yaml:"
146-
yq eval '.image' $POPULATOR_CHART/values.yaml
142+
# Update launcher-populator image
143+
yq eval -i ".launcherPopulator.image.repository = \"ghcr.io/${reg@L}/launcher-populator\"" $CHART/values.yaml
144+
yq eval -i ".launcherPopulator.image.tag = \"${TAG}\"" $CHART/values.yaml
145+
146+
echo "Updated launcher-populator image:"
147+
yq eval '.launcherPopulator.image' $CHART/values.yaml
147148
148149
# -----------------------------------------
149150
# 10. Login to GHCR for Helm
@@ -198,10 +199,8 @@ jobs:
198199
echo " • ghcr.io/${reg@L}/requester:$TAG"
199200
echo ""
200201
echo "Helm Charts (version $VERSION):"
201-
echo " • oci://ghcr.io/${reg@L}/charts/dual-pods-controller"
202-
echo " • oci://ghcr.io/${reg@L}/charts/launcher-populator"
202+
echo " • oci://ghcr.io/${reg@L}/charts/fma-controllers"
203203
echo ""
204204
echo "Install with:"
205-
echo " helm install dpctlr oci://ghcr.io/${reg@L}/charts/dual-pods-controller --version $VERSION"
206-
echo " helm install launcher-populator oci://ghcr.io/${reg@L}/charts/launcher-populator --version $VERSION"
205+
echo " helm install dpctlr oci://ghcr.io/${reg@L}/charts/fma-controllers --version $VERSION"
207206
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"

charts/dual-pods-controller/Chart.yaml

Lines changed: 0 additions & 16 deletions
This file was deleted.

charts/dual-pods-controller/templates/deployment.yaml

Lines changed: 0 additions & 35 deletions
This file was deleted.

charts/dual-pods-controller/templates/policies/validating-admission-policy-binding-fields.yaml

Lines changed: 0 additions & 16 deletions
This file was deleted.

charts/dual-pods-controller/templates/policies/validating-admission-policy-binding-serverReqPod.yaml

Lines changed: 0 additions & 16 deletions
This file was deleted.

charts/dual-pods-controller/templates/policies/validating-admission-policy-bound-serverReqPod.yaml

Lines changed: 0 additions & 32 deletions
This file was deleted.

charts/dual-pods-controller/templates/policies/validating-admission-policy-immutable-fields.yaml

Lines changed: 0 additions & 29 deletions
This file was deleted.

0 commit comments

Comments
 (0)