@@ -71,10 +71,10 @@ class VllmConfig:
7171 init = False , default_factory = dict
7272 )
7373
74- # Parallelism sizes are tunix-owned VllmConfig fields that require special
75- # processing before being passed to vLLM. They must not be passed via
76- # engine_kwargs, which is a direct pass-through to vLLM EngineArgs.
77- _SHARDING_KEYS : frozenset [str ] = dataclasses .field (
74+ # VllmConfig fields that require special processing before being passed to
75+ # vLLM and must not be passed via engine_kwargs, which is a raw pass-through
76+ # to vLLM EngineArgs.
77+ _RESERVED_KEYS : frozenset [str ] = dataclasses .field (
7878 default = frozenset (
7979 {"tensor_parallel_size" , "data_parallel_size" , "expert_parallel_size" }
8080 ),
@@ -85,11 +85,11 @@ class VllmConfig:
8585
8686 def __post_init__ (self , engine_kwargs : Optional [Dict [str , Any ]]):
8787 engine_kwargs = engine_kwargs or {}
88- illegal = self ._SHARDING_KEYS & engine_kwargs .keys ()
88+ illegal = self ._RESERVED_KEYS & engine_kwargs .keys ()
8989 if illegal :
9090 raise ValueError (
91- f"Sharding parallelism sizes must be set directly on VllmConfig, not"
92- f" passed via engine_kwargs: { sorted (illegal )} "
91+ f"VllmConfig fields must be set directly on VllmConfig, not passed"
92+ f" via engine_kwargs: { sorted (illegal )} "
9393 )
9494 self ._processed_engine_kwargs = engine_kwargs
9595 if engine_kwargs :
0 commit comments