Skip to content

Commit e557236

Browse files
committed
fix last commit
Signed-off-by: Eric Bishop <ericbish.dev@gmail.com>
1 parent 9cd3bfa commit e557236

2 files changed

Lines changed: 9 additions & 9 deletions

File tree

providers/llmd/Makefile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ export
1212
# Inject the build-time tag into the provider binary so it
1313
# tracks /versions.env automatically. The Go fallback in config.go only
1414
# applies when bypassing this Makefile (e.g. `go run`, `go test`).
15-
LDFLAGS := -X github.com/kaito-project/airunway/providers/llmd.LLMDSchedulerImage=$(LLMD_VERSION)
15+
# NOTE: the -X target must name the Go variable exactly (LLMDSchedulerImage in
# config.go); a -X for a name that is not a declared string variable has no effect.
LDFLAGS := -X github.com/kaito-project/airunway/providers/llmd.LLMDSchedulerImage=ghcr.io/llm-d/llm-d-inference-scheduler:v$(LLMD_VERSION)
1616

1717
.PHONY: build vet test docker-build deploy generate-deploy-manifests
1818

providers/llmd/config.go

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -44,14 +44,6 @@ const (
4444
// HeartbeatInterval is the interval for updating the provider heartbeat
4545
HeartbeatInterval = 1 * time.Minute
4646

47-
// LLMDSchedulerImage is the llm-d Inference Scheduler image used as the
48-
// EPP for all llm-d ModelDeployments.
49-
//
50-
// Source of truth: /versions.env at the repo root.
51-
// (see providers/llmd/Makefile). The string literal below is a fallback for
52-
// `go run` / `go test` invocations that bypass the Makefile.
53-
LLMDSchedulerImage = "ghcr.io/llm-d/llm-d-inference-scheduler:v0.6.0"
54-
5547
// LLMDSchedulerDefaultConfig is the default EndpointPickerConfig shipped
5648
// with the llm-d provider. It mirrors deploy/config/epp-config.yaml from
5749
// llm-d-inference-scheduler: a heuristic prefix-cache scorer
@@ -75,6 +67,14 @@ schedulingProfiles:
7567
`
7668
)
7769

70+
// LLMDSchedulerImage is the llm-d Inference Scheduler image used as the
71+
// EPP for all llm-d ModelDeployments.
72+
//
73+
// Source of truth: /versions.env at the repo root, injected at build time
74+
// (see providers/llmd/Makefile). The string literal below is a fallback for
75+
// `go run` / `go test` invocations that bypass the Makefile.
76+
var LLMDSchedulerImage = "ghcr.io/llm-d/llm-d-inference-scheduler:v0.6.0" // must stay a string var (not a const): -ldflags -X can only set string variables
77+
7878
// ProviderConfigManager handles registration and heartbeat for the llm-d provider
7979
type ProviderConfigManager struct {
8080
client client.Client

0 commit comments

Comments
 (0)