File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 1212# Inject the build-time tag into the provider binary so it
1313# tracks /versions.env automatically. The Go fallback in config.go only
1414# applies when bypassing this Makefile (e.g. `go run`, `go test`).
15- LDFLAGS := -X github.com/kaito-project/airunway/providers/llmd.LLMDSchedulerImage= $(LLMD_VERSION )
15+ LDFLAGS := -X github.com/kaito-project/airunway/providers/llmd.LLMDSchedulerImage=ghcr.io/llm-d/llm-d-inference-scheduler:v$(LLMD_VERSION)
1616
1717.PHONY : build vet test docker-build deploy generate-deploy-manifests
1818
Original file line number Diff line number Diff line change @@ -44,14 +44,6 @@ const (
4444 // HeartbeatInterval is the interval for updating the provider heartbeat
4545 HeartbeatInterval = 1 * time .Minute
4646
47- // LLMDSchedulerImage is the llm-d Inference Scheduler image used as the
48- // EPP for all llm-d ModelDeployments.
49- //
50- // Source of truth: /versions.env at the repo root.
51- // (see providers/llmd/Makefile). The string literal below is a fallback for
52- // `go run` / `go test` invocations that bypass the Makefile.
53- LLMDSchedulerImage = "ghcr.io/llm-d/llm-d-inference-scheduler:v0.6.0"
54-
5547 // LLMDSchedulerDefaultConfig is the default EndpointPickerConfig shipped
5648 // with the llm-d provider. It mirrors deploy/config/epp-config.yaml from
5749 // llm-d-inference-scheduler: a heuristic prefix-cache scorer
@@ -75,6 +67,14 @@ schedulingProfiles:
7567`
7668)
7769
70+ // LLMDSchedulerImage is the llm-d Inference Scheduler image used as the
71+ // EPP for all llm-d ModelDeployments.
72+ //
73+ // Source of truth: /versions.env at the repo root, injected at link time via
74+ // -ldflags -X (see providers/llmd/Makefile). The string literal below is a
75+ // fallback for `go run` / `go test` invocations that bypass the Makefile.
76+ var LLMDSchedulerImage = "ghcr.io/llm-d/llm-d-inference-scheduler:v0.6.0"
77+
7878// ProviderConfigManager handles registration and heartbeat for the llm-d provider
7979type ProviderConfigManager struct {
8080 client client.Client
You can’t perform that action at this time.
0 commit comments