We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent b5a1595 · commit 5128a75 · Copy full SHA for 5128a75
tests/test_paged_prefix_caching.py
@@ -26,7 +26,7 @@ def _make_paged_runner(num_layers: int = 2) -> mr.MetalModelRunner:
26
runner = mr.MetalModelRunner.__new__(mr.MetalModelRunner)
27
runner.model = MagicMock()
28
runner._is_stt = False
29
- runner._paged_kv_cache = MagicMock() # non-None enables paged path
+ runner._paged_attention_backend = MagicMock() # non-None enables paged path
30
runner._paged_block_size = 4
31
runner._paged_request_seq_lens = {}
32
runner._request_states = {}
0 commit comments