We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 82a1bbc, commit a2c280e (Copy full SHA for a2c280e)
1 file changed
vllm_rbln/worker/worker.py
@@ -392,7 +392,7 @@ def _init_cache_engine(self):
392
393
bind_kv_cache(self.compilation_config.static_forward_context,
394
self.cpu_cache)
395
- if not self.model_config.enforce_eager:
+ if not self.model_config.enforce_eager and envs.RBLN_COMPILE_MODEL:
396
for kv_cache in cpu_cache:
397
self.model_runner.compile_context.mark_static_address(kv_cache)
398
0 commit comments