merge: resolve conflict with main in gate_factory.go

lioraron · claude · lioraron · commit f323b66ef3e1 · 2026-04-16T12:19:39.000-04:00
Keep both the DefaultCacheTTL constant from this branch and the
GateFactory interface compliance check added on main.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
diff --git a/pkg/async/api/api.go b/pkg/async/api/api.go
@@ -41,6 +41,8 @@ type GateFactory interface {
 	CreateGate(gateType string, params map[string]string) (DispatchGate, error)
 }
 
+var _ DispatchGate = DispatchGateFunc(nil)
+
 // DispatchGateFunc is a function type that implements DispatchGate.
 // This allows any function with the signature func(context.Context) float64
 // to be used as a DispatchGate.
diff --git a/pkg/async/api/http_client.go b/pkg/async/api/http_client.go
@@ -8,6 +8,8 @@ import (
 	"net/http"
 )
 
+var _ InferenceClient = (*HTTPInferenceClient)(nil)
+
 // HTTPInferenceClient is the default HTTP implementation of InferenceClient.
 type HTTPInferenceClient struct {
 	client *http.Client
diff --git a/pkg/async/api/inference_error.go b/pkg/async/api/inference_error.go
@@ -31,6 +31,8 @@ type InferenceError interface {
 	Category() ErrorCategory
 }
 
+var _ InferenceError = (*ClientError)(nil)
+
 // ClientError represents an inference client error with category and context.
 type ClientError struct {
 	ErrorCategory ErrorCategory
diff --git a/pkg/async/inference/flowcontrol/binary_metric_dispatch_gate.go b/pkg/async/inference/flowcontrol/binary_metric_dispatch_gate.go
@@ -20,6 +20,7 @@ import (
 	"context"
 	"flag"
 
+	asyncapi "github.com/llm-d-incubation/llm-d-async/pkg/async/api"
 	"github.com/prometheus/client_golang/api"
 	"sigs.k8s.io/controller-runtime/pkg/log"
 	logutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
@@ -30,6 +31,8 @@ var prometheusURL = flag.String("gate.prometheus.url", "", "Prometheus URL for n
 var gmpProjectID = flag.String("gate.pmetric.gmp.project-id", "", "Project ID for Google Managed Prometheus")
 var prometheusQueryModelName = flag.String("gate.prometheus.model-name", "", "metrics name to use for avg_queue_size")
 
+var _ asyncapi.DispatchGate = (*BinaryMetricDispatchGate)(nil)
+
 // BinaryMetricDispatchGate implements DispatchGate using a MetricSource.
 // It returns 0.0 (no capacity) if the metric value is non-zero,
 // and 1.0 (full capacity) if the metric value is zero.
diff --git a/pkg/async/inference/flowcontrol/dispatch_gate.go b/pkg/async/inference/flowcontrol/dispatch_gate.go
@@ -22,6 +22,8 @@ import (
 	"github.com/llm-d-incubation/llm-d-async/pkg/async/api"
 )
 
+var _ api.DispatchGate = DispatchGateFunc(nil)
+
 // DispatchGateFunc is a function type that implements DispatchGate.
 // This allows any function with the signature func(context.Context) float64
 // to be used as a DispatchGate.
diff --git a/pkg/async/inference/flowcontrol/gate_factory.go b/pkg/async/inference/flowcontrol/gate_factory.go
@@ -30,6 +30,8 @@ import (
 // DefaultCacheTTL is the default TTL for cached Prometheus metric sources.
 const DefaultCacheTTL = 5 * time.Second
 
+var _ asyncapi.GateFactory = (*GateFactory)(nil)
+
 // GateFactory creates DispatchGate instances based on configuration.
 type GateFactory struct {
 	prometheusURL string
diff --git a/pkg/async/inference/flowcontrol/metric_source.go b/pkg/async/inference/flowcontrol/metric_source.go
@@ -46,6 +46,8 @@ type MetricSource interface {
 	Query(ctx context.Context) ([]Sample, error)
 }
 
+var _ MetricSource = (*PromQLMetricSource)(nil)
+
 // PromQLMetricSource implements MetricSource by executing a PromQL expression
 // against a Prometheus-compatible API.
 type PromQLMetricSource struct {
diff --git a/pkg/async/inference/flowcontrol/saturation_metric_dispatch_gate.go b/pkg/async/inference/flowcontrol/saturation_metric_dispatch_gate.go
@@ -21,6 +21,7 @@ import (
 	"flag"
 	"math"
 
+	asyncapi "github.com/llm-d-incubation/llm-d-async/pkg/async/api"
 	"github.com/prometheus/client_golang/api"
 	"sigs.k8s.io/controller-runtime/pkg/log"
 	logutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
@@ -31,6 +32,8 @@ var saturationThreshold = flag.Float64("gate.saturation.threshold", 0.8, "satura
 var saturationFallback = flag.Float64("gate.saturation.fallback", 0.0, "fallback saturation value on error/missing metrics; default 0.0")
 var saturationQueryExpr = flag.String("gate.saturation.query-expr", "", "custom PromQL expression for saturation metric; overrides inference-pool label selector")
 
+var _ asyncapi.DispatchGate = (*SaturationMetricDispatchGate)(nil)
+
 // SaturationMetricDispatchGate implements DispatchGate based on pool saturation.
 // It queries a MetricSource for saturation samples and returns 0.0 if saturation
 // is at or above the configured threshold, otherwise returns max(0, 1 - saturation),
diff --git a/pkg/async/random_robin_policy.go b/pkg/async/random_robin_policy.go
@@ -10,11 +10,13 @@ func NewRandomRobinPolicy() api.RequestMergePolicy {
 	return &RandomRobinPolicy{}
 }
 
+var _ api.RequestMergePolicy = (*RandomRobinPolicy)(nil)
+
 type RandomRobinPolicy struct {
 }
 
 func (r *RandomRobinPolicy) MergeRequestChannels(channels []api.RequestChannel) api.EmbelishedRequestChannel {
-	mergedChannel := make(chan api.EmbelishedRequestMessage)
+	mergedChannel := make(chan api.EmbelishedRequestMessage, len(channels))
 
 	cases := make([]reflect.SelectCase, len(channels)) //nolint:staticcheck
 	for i, ch := range channels {
diff --git a/pkg/async/random_robin_policy_test.go b/pkg/async/random_robin_policy_test.go
@@ -2,6 +2,7 @@ package async
 
 import (
 	"testing"
+	"time"
 
 	"github.com/llm-d-incubation/llm-d-async/pkg/async/api"
 )
@@ -41,3 +42,33 @@ func TestProcessAllChannels(t *testing.T) {
 		}
 	}
 }
+
+// TestMergedChannelIsBuffered verifies that the channel returned by
+// MergeRequestChannels can hold one message per input channel while
+// nothing is receiving from it.
+func TestMergedChannelIsBuffered(t *testing.T) {
+	numChannels := 3
+	channels := make([]api.RequestChannel, numChannels)
+	for i := range numChannels {
+		channels[i] = api.RequestChannel{Channel: make(chan api.RequestMessage, 1)}
+	}
+	policy := NewRandomRobinPolicy()
+	merged := policy.MergeRequestChannels(channels)
+
+	// Send one message per input channel.
+	for i, ch := range channels {
+		ch.Channel <- api.RequestMessage{Id: string(rune('A' + i))}
+	}
+
+	// Do not receive from merged.Channel here: a consumer would let the test
+	// pass even with an unbuffered channel. Instead poll len(), which only
+	// reaches numChannels if the merge goroutine can park every message in
+	// the channel's buffer without anyone draining it.
+	deadline := time.Now().Add(2 * time.Second)
+	for len(merged.Channel) < numChannels {
+		if time.Now().After(deadline) {
+			t.Fatalf("timed out: only %d/%d messages buffered — merged channel may be unbuffered", len(merged.Channel), numChannels)
+		}
+		time.Sleep(time.Millisecond)
+	}
+}
diff --git a/pkg/producer/redis_sortedset_producer.go b/pkg/producer/redis_sortedset_producer.go
@@ -12,6 +12,8 @@ import (
 	"github.com/redis/go-redis/v9"
 )
 
+var _ Producer = (*RedisSortedSetProducer)(nil)
+
 // RedisSortedSetProducer implements Producer using Redis sorted set for requests
 // and Redis list for results.
 type RedisSortedSetProducer struct {
diff --git a/pkg/pubsub/pubsubimpl.go b/pkg/pubsub/pubsubimpl.go
@@ -43,6 +43,9 @@ type TopicConfig struct {
 	GateType           string            `json:"gate_type"`
 	GateParams         map[string]string `json:"gate_params,omitempty"`
 }
+
+var _ api.Flow = (*PubSubMQFlow)(nil)
+
 type PubSubMQFlow struct {
 	resultTopicID   string
 	requestChannels []RequestChannelData
diff --git a/pkg/redis/dispatch_gate.go b/pkg/redis/dispatch_gate.go
@@ -4,11 +4,14 @@ import (
 	"context"
 	"strconv"
 
+	"github.com/llm-d-incubation/llm-d-async/pkg/async/api"
 	goredis "github.com/redis/go-redis/v9"
 	"sigs.k8s.io/controller-runtime/pkg/log"
 	logutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
 )
 
+var _ api.DispatchGate = (*RedisDispatchGate)(nil)
+
 // RedisDispatchGate implements api.DispatchGate by reading the budget
 // from a Redis key. This allows external systems to dynamically control
 // the dispatch rate. If the key does not exist or is invalid, it defaults
diff --git a/pkg/redis/redisimpl.go b/pkg/redis/redisimpl.go
@@ -76,6 +76,8 @@ type RequestChannelData struct {
 	queueName      string
 }
 
+var _ api.Flow = (*RedisMQFlow)(nil)
+
 type RedisMQFlow struct {
 	rdb             *redis.Client
 	requestChannels []RequestChannelData
diff --git a/pkg/redis/sortedset_impl.go b/pkg/redis/sortedset_impl.go
@@ -61,6 +61,8 @@ type requestChannelData struct {
 	gate      api.DispatchGate
 }
 
+var _ api.Flow = (*RedisSortedSetFlow)(nil)
+
 type RedisSortedSetFlow struct {
 	rdb             *redis.Client
 	requestChannels []requestChannelData

Original file line number	Diff line number	Diff line change
`@@ -41,6 +41,8 @@ type GateFactory interface {`
`41`	`41`	`CreateGate(gateType string, params map[string]string) (DispatchGate, error)`
`42`	`42`	`}`
`43`	`43`
	`44`	`+var _ DispatchGate = DispatchGateFunc(nil)`
	`45`	`+`
`44`	`46`	`// DispatchGateFunc is a function type that implements DispatchGate.`
`45`	`47`	`// This allows any function with the signature func(context.Context) float64`
`46`	`48`	`// to be used as a DispatchGate.`
Original file line number	Diff line number	Diff line change
`@@ -8,6 +8,8 @@ import (`
`8`	`8`	`"net/http"`
`9`	`9`	`)`
`10`	`10`
	`11`	`+var _ InferenceClient = (*HTTPInferenceClient)(nil)`
	`12`	`+`
`11`	`13`	`// HTTPInferenceClient is the default HTTP implementation of InferenceClient.`
`12`	`14`	`type HTTPInferenceClient struct {`
`13`	`15`	`client *http.Client`
Original file line number	Diff line number	Diff line change
`@@ -31,6 +31,8 @@ type InferenceError interface {`
`31`	`31`	`Category() ErrorCategory`
`32`	`32`	`}`
`33`	`33`
	`34`	`+var _ InferenceError = (*ClientError)(nil)`
	`35`	`+`
`34`	`36`	`// ClientError represents an inference client error with category and context.`
`35`	`37`	`type ClientError struct {`
`36`	`38`	`ErrorCategory ErrorCategory`
Original file line number	Diff line number	Diff line change
`@@ -22,6 +22,8 @@ import (`
`22`	`22`	`"github.com/llm-d-incubation/llm-d-async/pkg/async/api"`
`23`	`23`	`)`
`24`	`24`
	`25`	`+var _ api.DispatchGate = DispatchGateFunc(nil)`
	`26`	`+`
`25`	`27`	`// DispatchGateFunc is a function type that implements DispatchGate.`
`26`	`28`	`// This allows any function with the signature func(context.Context) float64`
`27`	`29`	`// to be used as a DispatchGate.`
Original file line number	Diff line number	Diff line change
`@@ -46,6 +46,8 @@ type MetricSource interface {`
`46`	`46`	`Query(ctx context.Context) ([]Sample, error)`
`47`	`47`	`}`
`48`	`48`
	`49`	`+var _ MetricSource = (*PromQLMetricSource)(nil)`
	`50`	`+`
`49`	`51`	`// PromQLMetricSource implements MetricSource by executing a PromQL expression`
`50`	`52`	`// against a Prometheus-compatible API.`
`51`	`53`	`type PromQLMetricSource struct {`
Original file line number	Diff line number	Diff line change
`@@ -10,11 +10,13 @@ func NewRandomRobinPolicy() api.RequestMergePolicy {`
`10`	`10`	`return &RandomRobinPolicy{}`
`11`	`11`	`}`
`12`	`12`
	`13`	`+var _ api.RequestMergePolicy = (*RandomRobinPolicy)(nil)`
	`14`	`+`
`13`	`15`	`type RandomRobinPolicy struct {`
`14`	`16`	`}`
`15`	`17`
`16`	`18`	`func (r *RandomRobinPolicy) MergeRequestChannels(channels []api.RequestChannel) api.EmbelishedRequestChannel {`
`17`		`- mergedChannel := make(chan api.EmbelishedRequestMessage)`
	`19`	`+ mergedChannel := make(chan api.EmbelishedRequestMessage, len(channels))`
`18`	`20`
`19`	`21`	`cases := make([]reflect.SelectCase, len(channels)) //nolint:staticcheck`
`20`	`22`	`for i, ch := range channels {`