Skip to content
Merged
Show file tree
Hide file tree
Changes from 48 commits
Commits
Show all changes
50 commits
Select commit Hold shift + click to select a range
b228bb7
feat: implement decode first flow on lmcache connector
kyanokashi Dec 9, 2025
a436b50
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Dec 9, 2025
a6ae771
fix: error handling
kyanokashi Dec 10, 2025
58388eb
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Dec 11, 2025
04b7ffd
chore: add back todo comment
kyanokashi Dec 11, 2025
ce74f50
refactor: reduce code complexity and duplication
kyanokashi Dec 11, 2025
1de6035
refactor: improve header copying
kyanokashi Dec 11, 2025
c0ac69e
chore: add comment explaning the cache_hit_threshold field and the ne…
kyanokashi Dec 15, 2025
7ce5e19
refactor: enhance logging for cache hit threshold in decode flow
kyanokashi Dec 15, 2025
6430a02
refactor: improve error handling and observability when failing to un…
kyanokashi Dec 15, 2025
4c15d95
chore: add deleted informational comments
kyanokashi Dec 15, 2025
cac084f
typo
kyanokashi Dec 15, 2025
91c7a06
refactor: make error logs more descriptive of the failure reason
kyanokashi Dec 15, 2025
69d30b5
feat: add cache hit threshold to prefill request so prefill executes …
kyanokashi Dec 15, 2025
1ed1d89
fix: typo
kyanokashi Dec 17, 2025
515b385
refactor: assign 0 cache_hit_threshold before final decode attempt
kyanokashi Dec 17, 2025
4c8659e
chore: update comment according to feedback
kyanokashi Dec 17, 2025
878585b
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Dec 17, 2025
722b58e
chore: remove istio workaround
kyanokashi Dec 17, 2025
487d333
fix: set cache hit threshold to 0 in prefill request for consistent e…
kyanokashi Dec 18, 2025
cb00b52
refactor: update the log
kyanokashi Dec 22, 2025
88739c6
feat: support online decoding
kyanokashi Dec 22, 2025
9fbb2d1
fix: preserve request body in lmcache connector
kyanokashi Dec 31, 2025
7b18827
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Dec 31, 2025
460b9c8
fix: support sse format for streamed decode
kyanokashi Jan 2, 2026
a722510
chore: add and improve log descriptions
kyanokashi Jan 2, 2026
e2b3380
fix: typo
kyanokashi Jan 4, 2026
548e6c8
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Jan 5, 2026
160fb72
nit: undo capitalization
kyanokashi Jan 5, 2026
9a08dfb
fix: typos
kyanokashi Jan 5, 2026
7508f10
chore: improve error log observability
kyanokashi Jan 5, 2026
bd114fa
refactor: encapsulate http error checking in function and reuse
kyanokashi Jan 5, 2026
5a6a4f6
refactor: encapsulate and reuse code better
kyanokashi Jan 5, 2026
6e6ff8f
fix: lint error
kyanokashi Jan 6, 2026
ea60bf0
refactor: improve code encapsulation and reduce duplication
kyanokashi Jan 6, 2026
0cbc6f9
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Jan 6, 2026
fd43c17
refactor: rename and simplify SSE event signaling logic
kyanokashi Jan 6, 2026
7030e38
refactor: rename lmcache to shared storage protocol
kyanokashi Jan 8, 2026
f84046a
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Jan 16, 2026
2f0e99e
fix: remove unused function
kyanokashi Jan 16, 2026
ea3f1da
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Jan 23, 2026
2e35d85
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Jan 31, 2026
d71b10b
test: e2e tests
kyanokashi Jan 31, 2026
e34600f
chore: claude gitignore
kyanokashi Jan 31, 2026
efd638a
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Feb 2, 2026
5e988e5
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Feb 3, 2026
fbb12fc
fix: sim deployment
kyanokashi Feb 5, 2026
903249f
Merge branch 'main' into feat/sidecar/lmcache-connector/decode-first
kyanokashi Feb 5, 2026
f6024d1
feat: make linter running on new code configurable
kyanokashi Feb 6, 2026
5f042e7
fix: lint errors
kyanokashi Feb 6, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,7 @@ go.work.sum
# Environment Files
.DS_Store
.env
CLAUDE.md

# IDE files
.idea
Expand Down
2 changes: 1 addition & 1 deletion Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ export EPP_IMAGE ?= $(IMAGE_TAG_BASE):$(EPP_TAG)
SIDECAR_TAG ?= dev
SIDECAR_IMAGE_TAG_BASE ?= $(IMAGE_REGISTRY)/$(SIDECAR_IMAGE_NAME)
export SIDECAR_IMAGE ?= $(SIDECAR_IMAGE_TAG_BASE):$(SIDECAR_TAG)
VLLM_SIMULATOR_TAG ?= v0.6.1
VLLM_SIMULATOR_TAG ?= latest
VLLM_SIMULATOR_TAG_BASE ?= $(IMAGE_REGISTRY)/$(VLLM_SIMULATOR_IMAGE_NAME)
export VLLM_SIMULATOR_IMAGE ?= $(VLLM_SIMULATOR_TAG_BASE):$(VLLM_SIMULATOR_TAG)
NAMESPACE ?= hc4ai-operator
Expand Down
2 changes: 1 addition & 1 deletion cmd/pd-sidecar/main.go
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ var (
// supportedConnectors defines all valid P/D connector types
supportedConnectors = []string{
proxy.ConnectorNIXLV2,
proxy.ConnectorLMCache,
proxy.ConnectorSharedStorage,
proxy.ConnectorSGLang,
}
)
Expand Down
91 changes: 0 additions & 91 deletions pkg/sidecar/proxy/connector_lmcache.go

This file was deleted.

2 changes: 1 addition & 1 deletion pkg/sidecar/proxy/connector_nixlv2.go
Original file line number Diff line number Diff line change
Expand Up @@ -107,7 +107,7 @@ func (s *Server) runNIXLProtocolV2(w http.ResponseWriter, r *http.Request, prefi
pw := &bufferedResponseWriter{}
prefillHandler.ServeHTTP(pw, preq)

if pw.statusCode < 200 || pw.statusCode >= 300 {
if isHTTPError(pw.statusCode) {
s.logger.Error(err, "request failed", "code", pw.statusCode)
w.WriteHeader(pw.statusCode)
return
Expand Down
Loading
Loading