update

gufengc · gufengc · commit 2c5e0a2bc6e2 · 2026-06-02T21:35:36.000+08:00
diff --git a/src/parallax/server/executor/mlx_executor.py b/src/parallax/server/executor/mlx_executor.py
@@ -199,7 +199,9 @@ def __init__(
             if chunked_prefill_size == 0:
                 chunked_prefill_size = None
             elif not enable_prefix_cache:
-                raise ValueError("Chunked prefill is not supported when disable prefix cache, please enable prefix cache or set --chunked-prefill-size 0")
+                raise ValueError(
+                    "Chunked prefill is not supported when disable prefix cache, please enable prefix cache or set --chunked-prefill-size 0"
+                )
 
         self.cache_manager = CacheManager(
             num_layers=self.num_shard_layers,
diff --git a/src/parallax/server/shard_loader.py b/src/parallax/server/shard_loader.py
@@ -39,6 +39,7 @@
     "GlmMoeDsaForCausalLM": "DeepseekV32ForCausalLM",
 }
 
+
 class MLXModelLoader:
     """
     Handles downloading model assets from Hugging Face (if needed) and loading

Original file line number	Diff line number	Diff line change
`@@ -39,6 +39,7 @@`
`39`	`39`	`"GlmMoeDsaForCausalLM": "DeepseekV32ForCausalLM",`
`40`	`40`	`}`
`41`	`41`
	`42`	`+`
`42`	`43`	`class MLXModelLoader:`
`43`	`44`	`"""`
`44`	`45`	`Handles downloading model assets from Hugging Face (if needed) and loading`