Skip to content

Commit 2c5e0a2

Browse files
committed
update
1 parent aca20c8 commit 2c5e0a2

2 files changed

Lines changed: 4 additions & 1 deletion

File tree

src/parallax/server/executor/mlx_executor.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -199,7 +199,9 @@ def __init__(
199199
if chunked_prefill_size == 0:
200200
chunked_prefill_size = None
201201
elif not enable_prefix_cache:
202-
raise ValueError("Chunked prefill is not supported when disable prefix cache, please enable prefix cache or set --chunked-prefill-size 0")
202+
raise ValueError(
203+
"Chunked prefill is not supported when disable prefix cache, please enable prefix cache or set --chunked-prefill-size 0"
204+
)
203205

204206
self.cache_manager = CacheManager(
205207
num_layers=self.num_shard_layers,

src/parallax/server/shard_loader.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@
3939
"GlmMoeDsaForCausalLM": "DeepseekV32ForCausalLM",
4040
}
4141

42+
4243
class MLXModelLoader:
4344
"""
4445
Handles downloading model assets from Hugging Face (if needed) and loading

0 commit comments

Comments
 (0)