|
| 1 | +/* |
| 2 | +Copyright 2025 The llm-d Authors. |
| 3 | +
|
| 4 | +Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | +you may not use this file except in compliance with the License. |
| 6 | +You may obtain a copy of the License at |
| 7 | +
|
| 8 | + http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | +
|
| 10 | +Unless required by applicable law or agreed to in writing, software |
| 11 | +distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | +See the License for the specific language governing permissions and |
| 14 | +limitations under the License. |
| 15 | +*/ |
| 16 | + |
| 17 | +package main |
| 18 | + |
| 19 | +import ( |
| 20 | + "context" |
| 21 | + "encoding/json" |
| 22 | + "fmt" |
| 23 | + "os" |
| 24 | + "strings" |
| 25 | + "time" |
| 26 | + |
| 27 | + corev1 "k8s.io/api/core/v1" |
| 28 | + apierrors "k8s.io/apimachinery/pkg/api/errors" |
| 29 | + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" |
| 30 | + apitypes "k8s.io/apimachinery/pkg/types" |
| 31 | + "k8s.io/apimachinery/pkg/util/sets" |
| 32 | + "k8s.io/apimachinery/pkg/util/wait" |
| 33 | + corev1client "k8s.io/client-go/kubernetes/typed/core/v1" |
| 34 | + |
| 35 | + dpctlr "github.com/llm-d-incubation/llm-d-fast-model-actuation/pkg/controller/dual-pods" |
| 36 | + |
| 37 | + "k8s.io/klog/v2" |
| 38 | +) |
| 39 | + |
// This code maintains a ConfigMap named "gpu-allocs" that holds the current test allocations
// of GPUs. The data of this ConfigMap is a map from GPU UID to the JSON marshaling of a GPUHolder.

// gpuMap maps node name to nodeGPUMap.
// It is the parsed form of the gpu-map ConfigMap (see getGPUMap),
// whose Data holds one JSON-encoded nodeGPUMap per node.
type gpuMap map[string]nodeGPUMap

// nodeGPUMap maps GPU UID to index.
// NOTE(review): presumably the index is the GPU's device index on its node — confirm with the producer of the gpu-map ConfigMap.
type nodeGPUMap map[string]int

// GPUHolder identifies a test requester that is currently allocated the use of a GPU.
// Values of this type are JSON-marshaled into the "gpu-allocs" ConfigMap's Data.
type GPUHolder struct {
	// NodeName is the name of the Node hosting the allocated GPU.
	NodeName string
	// PodUID is the UID of the Pod that currently holds the GPU.
	PodUID apitypes.UID
}

// GPUAllocMap maps GPU UID to GPUHolder.
type GPUAllocMap map[string]GPUHolder
| 57 | + |
| 58 | +func getGPUMap(ctx context.Context, cmClient corev1client.ConfigMapInterface) (gpuMap, error) { |
| 59 | + cm, err := cmClient.Get(ctx, dpctlr.GPUMapName, metav1.GetOptions{}) |
| 60 | + if err != nil { |
| 61 | + return nil, fmt.Errorf("failed to retrieve gpu-map ConfigMap: %w", err) |
| 62 | + } |
| 63 | + ans := gpuMap{} |
| 64 | + for nodeName, mapStr := range cm.Data { |
| 65 | + nm := nodeGPUMap{} |
| 66 | + err := json.Unmarshal([]byte(mapStr), &nm) |
| 67 | + if err != nil { |
| 68 | + return nil, fmt.Errorf("failed to parse GPU map for node %s: %w", nodeName, err) |
| 69 | + } |
| 70 | + ans[nodeName] = nm |
| 71 | + } |
| 72 | + return ans, nil |
| 73 | +} |
| 74 | + |
| 75 | +func (gm gpuMap) onNode(nodeName string) sets.Set[string] { |
| 76 | + ngm := gm[nodeName] |
| 77 | + if ngm != nil { |
| 78 | + return sets.KeySet(ngm) |
| 79 | + } |
| 80 | + return sets.New[string]() |
| 81 | +} |
| 82 | + |
// getGPUAlloc returns the current GPU allocations both as a parsed GPUAllocMap
// and as a deep-copied ConfigMap object that the caller may mutate and write back.
// If the allocation ConfigMap does not exist yet, it is created here (empty).
func getGPUAlloc(ctx context.Context, cmClient corev1client.ConfigMapInterface) (GPUAllocMap, *corev1.ConfigMap, error) {
	cm, err := cmClient.Get(ctx, allocMapName, metav1.GetOptions{})
	if err != nil {
		if apierrors.IsNotFound(err) {
			// It is up to us to create it
			cmProto := corev1.ConfigMap{
				TypeMeta: metav1.TypeMeta{
					Kind:       "ConfigMap",
					APIVersion: corev1.SchemeGroupVersion.String(),
				},
				ObjectMeta: metav1.ObjectMeta{
					Name: allocMapName,
				},
			}
			cm, err = cmClient.Create(ctx, &cmProto, metav1.CreateOptions{FieldManager: agentName})
			if err != nil {
				return nil, nil, fmt.Errorf("failed to create GPU allocation ConfigMap: %w", err)
			}
		} else {
			return nil, nil, fmt.Errorf("failed to fetch GPU allocation ConfigMap: %w", err)
		}
	}
	ans := GPUAllocMap{}
	for gpuUID, holderStr := range cm.Data {
		holderReader := strings.NewReader(holderStr)
		var holder GPUHolder
		// Decode strictly: unknown fields indicate a corrupt or incompatible entry.
		decoder := json.NewDecoder(holderReader)
		decoder.DisallowUnknownFields()
		err = decoder.Decode(&holder)
		if err != nil {
			return nil, nil, fmt.Errorf("failed to decode GPU allocation for GPU UID %s: %w", gpuUID, err)
		}
		ans[gpuUID] = holder
	}
	// Deep-copy so the caller can mutate Data without aliasing any cached object,
	// and guarantee Data is non-nil so callers can assign into it directly.
	cm = cm.DeepCopy()
	if cm.Data == nil {
		cm.Data = map[string]string{}
	}
	return ans, cm, nil
}
| 123 | + |
// allocateGPUs allocates numGPUs GPUs on the given node to the Pod identified by podUID,
// recording the allocation in the "gpu-allocs" ConfigMap. It retries once per second until
// the allocation succeeds or ctx is canceled; on final failure it exits the process with
// status 100. Returns the UIDs of the allocated GPUs.
func allocateGPUs(ctx context.Context, coreClient corev1client.CoreV1Interface, nodeName, namespace string, podUID apitypes.UID, numGPUs uint) []string {
	logger := klog.FromContext(ctx)
	cmClient := coreClient.ConfigMaps(namespace)
	podClient := coreClient.Pods(namespace)
	// Captured by the closure below; set on the successful attempt.
	var gpuUIDs []string
	// try once to allocate the requested number of GPUs;
	// on failure return explanatory error;
	// on success return nil.
	try := func(ctx context.Context) (err error) {
		gpuMap, err := getGPUMap(ctx, cmClient)
		if err != nil {
			return err
		}
		avail := gpuMap.onNode(nodeName)
		podUIDs, err := getPodUIDs(ctx, podClient)
		if err != nil {
			return err
		}
		// The requesting Pod must still exist; otherwise the allocation would leak.
		if !podUIDs.Has(podUID) {
			return fmt.Errorf("pod UID %q not found among current Pods", podUID)
		}
		// Get the current allocations, as a data structure and as a ConfigMap object.
		gpuAllocMap, gpuAllocCM, err := getGPUAlloc(ctx, cmClient)
		if err != nil {
			return err
		}
		// Collect the ones used by other Pods on the same Node,
		// and remove obsolete entries from the ConfigMap.
		used := sets.New[string]()
		for gpuUID, holder := range gpuAllocMap {
			if holder.NodeName != nodeName {
				continue
			}
			if !podUIDs.Has(holder.PodUID) {
				// Holder Pod is gone: garbage-collect this stale allocation.
				delete(gpuAllocCM.Data, gpuUID)
			} else if holder.PodUID != podUID {
				used.Insert(gpuUID)
			}
		}
		// Compute the sorted list of unused GPUs on the right Node.
		rem := sets.List(avail.Difference(used))
		if uint(len(rem)) < numGPUs {
			return fmt.Errorf("fewer than %d GPUs available (%v) for node %q", numGPUs, rem, nodeName)
		}
		// Take the requested number
		// FROM THE HEAD OF THE LIST --- this is a choice to aid making repeatable tests.
		gpuUIDs = rem[:numGPUs]
		for _, gpuUID := range gpuUIDs {
			holder := GPUHolder{NodeName: nodeName, PodUID: podUID}
			holderBytes, err := json.Marshal(holder)
			if err != nil {
				return fmt.Errorf("failed to marshal holder for GPU %s (%#v): %w", gpuUID, holder, err)
			}
			gpuAllocCM.Data[gpuUID] = string(holderBytes)
		}
		// The Update carries the ResourceVersion from the Get inside getGPUAlloc,
		// so a concurrent writer causes a conflict error and we retry from scratch.
		echo, err := cmClient.Update(ctx, gpuAllocCM, metav1.UpdateOptions{
			FieldManager: agentName,
		})
		if err != nil {
			return fmt.Errorf("failed to update GPU allocation ConfigMap: %w", err)
		}
		logger.Info("Successful allocation", "nodeName", nodeName, "podUID", podUID, "gpus", gpuUIDs, "newResourceVersion", echo.ResourceVersion)
		return nil
	}
	// Retry every second (immediate first attempt) until success or ctx cancellation.
	err := wait.PollUntilContextCancel(ctx, time.Second, true, func(ctx context.Context) (bool, error) {
		err := try(ctx)
		if err != nil {
			logger.Error(err, "Failed to allocate")
		}
		return err == nil, nil
	})
	if err != nil {
		fmt.Fprintf(os.Stderr, "Failed to allocate GPUS: %s\n", err.Error())
		os.Exit(100)
	}
	return gpuUIDs
}
| 201 | + |
| 202 | +func getPodUIDs(ctx context.Context, podClient corev1client.PodInterface) (sets.Set[apitypes.UID], error) { |
| 203 | + podList, err := podClient.List(ctx, metav1.ListOptions{}) |
| 204 | + if err != nil { |
| 205 | + return nil, err |
| 206 | + } |
| 207 | + uids, _ := dpctlr.SliceMap(podList.Items, func(pod corev1.Pod) (apitypes.UID, error) { |
| 208 | + return pod.UID, nil |
| 209 | + }) |
| 210 | + return sets.New(uids...), nil |
| 211 | +} |
0 commit comments