We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f36b7fa, commit 15a8a0a (Copy full SHA for 15a8a0a)
swift/megatron/arguments/megatron_args.py
@@ -700,7 +700,6 @@ def _init_mixed_precision(self):
700
if self.apply_query_key_layer_scaling:
701
os.environ['NVTE_APPLY_QK_LAYER_SCALING'] = '1'
702
703
- @staticmethod
704
def _init_moe(self):
705
if self.moe_router_dtype.lower() == 'none':
706
self.moe_router_dtype = None
@@ -775,7 +774,7 @@ def __post_init__(self):
775
774
logger.info('Setting args.tuner_type: lora')
776
if self.adapters:
777
self._load_adapter_config()
778
- MegatronArguments._init_moe(self)
+ self._init_moe()
779
self._init_mixed_precision()
780
781
self.megatron_extra_kwargs = json_parse_to_dict(self.megatron_extra_kwargs)
0 commit comments