Commit 6ef2004

Merge branch 'main' into gpt_oss_sink
2 parents: cf95e02 + 8677159

31 files changed: +62, -151 lines

src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_cosmos.py

Lines changed: 3 additions & 3 deletions
@@ -68,7 +68,7 @@ def __post_init__(self, **kwargs):
         self.image_size = self.rbln_config.image_size

     @classmethod
-    def wrap_model_if_needed(
+    def _wrap_model_if_needed(
         cls, model: torch.nn.Module, rbln_config: RBLNAutoencoderKLCosmosConfig
     ) -> torch.nn.Module:
         decoder_model = _VAECosmosDecoder(model)
@@ -98,7 +98,7 @@ def replaced_forward(self, hidden_states: torch.Tensor) -> torch.Tensor:

         compiled_models = {}
         if rbln_config.uses_encoder:
-            encoder_model, decoder_model = cls.wrap_model_if_needed(model, rbln_config)
+            encoder_model, decoder_model = cls._wrap_model_if_needed(model, rbln_config)
             enc_compiled_model = cls.compile(
                 encoder_model,
                 rbln_compile_config=rbln_config.compile_cfgs[0],
@@ -107,7 +107,7 @@ def replaced_forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
             )
             compiled_models["encoder"] = enc_compiled_model
         else:
-            decoder_model = cls.wrap_model_if_needed(model, rbln_config)
+            decoder_model = cls._wrap_model_if_needed(model, rbln_config)
             dec_compiled_model = cls.compile(
                 decoder_model,
                 rbln_compile_config=rbln_config.compile_cfgs[-1],

src/optimum/rbln/diffusers/models/controlnet.py

Lines changed: 1 addition & 1 deletion
@@ -118,7 +118,7 @@ def __post_init__(self, **kwargs):
         )

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
         use_encoder_hidden_states = False
         for down_block in model.down_blocks:
             if use_encoder_hidden_states := getattr(down_block, "has_cross_attention", False):

src/optimum/rbln/diffusers/models/transformers/prior_transformer.py

Lines changed: 1 addition & 1 deletion
@@ -77,7 +77,7 @@ def __post_init__(self, **kwargs):
         self.clip_std = artifacts["clip_std"]

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
         return _PriorTransformer(model).eval()

     @classmethod

src/optimum/rbln/diffusers/models/transformers/transformer_cosmos.py

Lines changed: 1 addition & 1 deletion
@@ -185,7 +185,7 @@ def compute_embedding(
         )

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
         num_latent_frames = rbln_config.num_latent_frames
         latent_height = rbln_config.latent_height
         latent_width = rbln_config.latent_width

src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py

Lines changed: 1 addition & 1 deletion
@@ -77,7 +77,7 @@ def __post_init__(self, **kwargs):
         super().__post_init__(**kwargs)

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
         return SD3Transformer2DModelWrapper(model).eval()

     @classmethod

src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py

Lines changed: 1 addition & 1 deletion
@@ -171,7 +171,7 @@ class ADDEMBEDDING:
         self.add_embedding = ADDEMBEDDING(LINEAR1(self.in_features))

     @classmethod
-    def wrap_model_if_needed(
+    def _wrap_model_if_needed(
         cls, model: torch.nn.Module, rbln_config: RBLNUNet2DConditionModelConfig
     ) -> torch.nn.Module:
         if model.config.addition_embed_type == "text_time":

src/optimum/rbln/modeling.py

Lines changed: 2 additions & 45 deletions
@@ -34,49 +34,6 @@
 logger = get_logger(__name__)


-def _get_dtype(
-    cls,
-    dtype: Optional[Union[str, torch.dtype, dict]],
-    config: PretrainedConfig,
-) -> tuple[PretrainedConfig, Optional[torch.dtype], Optional[torch.dtype]]:
-    dtype_orig = None
-
-    if dtype is not None:
-        if isinstance(dtype, str):
-            if dtype == "auto":
-                if hasattr(config, "dtype") and config.dtype is not None:
-                    dtype = config.dtype
-                else:
-                    dtype = torch.get_default_dtype()
-            elif hasattr(torch, dtype):
-                dtype = getattr(torch, dtype)
-            config.dtype = dtype
-        elif isinstance(dtype, torch.dtype):
-            config.dtype = dtype
-        elif isinstance(dtype, dict):
-            for key, curr_dtype in dtype.items():
-                if hasattr(config, key):
-                    value = getattr(config, key)
-                    curr_dtype = curr_dtype if not isinstance(curr_dtype, str) else getattr(torch, curr_dtype)
-                    value.dtype = curr_dtype
-            # main torch dtype for modules that aren't part of any sub-config
-            dtype = dtype.get("")
-            dtype = dtype if not isinstance(dtype, str) else getattr(torch, dtype)
-            config.dtype = dtype
-            if dtype is None:
-                dtype = torch.float32
-        else:
-            raise ValueError(f"Invalid dtype: {dtype}")
-
-        dtype_orig = cls._set_default_dtype(dtype)
-    else:
-        # Use default dtype
-        default_dtype = torch.get_default_dtype()
-        config.dtype = default_dtype
-
-    return config, dtype, dtype_orig
-
-
 class RBLNModel(RBLNBaseModel):
     @classmethod
     def update_kwargs(cls, kwargs):
@@ -97,13 +54,13 @@ def save_torch_artifacts(
         pass

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNModelConfig) -> torch.nn.Module:
         # Wrap the model if needed.
         return model

     @classmethod
     def get_compiled_model(cls, model: "PreTrainedModel", rbln_config: RBLNModelConfig):
-        model = cls.wrap_model_if_needed(model, rbln_config)
+        model = cls._wrap_model_if_needed(model, rbln_config)
         rbln_compile_config = rbln_config.compile_cfgs[0]
         compiled_model = cls.compile(
             model,
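For reference, the hook contract this rename preserves, as a minimal sketch rather than the library's actual code (RBLNMyModel and MyModelWrapper below are hypothetical names): get_compiled_model() calls cls._wrap_model_if_needed() before cls.compile(), and a subclass overrides the now-private hook to hand back a compile-friendly torch.nn.Module.

import torch

# Hypothetical subclass illustrating how the renamed hook is overridden.
class MyModelWrapper(torch.nn.Module):
    def __init__(self, model: torch.nn.Module):
        super().__init__()
        self.model = model

    def forward(self, input_ids: torch.Tensor) -> torch.Tensor:
        # Expose only tensor outputs so the graph can be traced for compilation.
        return self.model(input_ids)

class RBLNMyModel:  # stands in for an RBLNModel subclass
    @classmethod
    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config) -> torch.nn.Module:
        # The base class returns `model` unchanged; subclasses return a wrapper in eval mode.
        return MyModelWrapper(model).eval()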

src/optimum/rbln/transformers/modeling_generic.py

Lines changed: 2 additions & 2 deletions
@@ -59,7 +59,7 @@ class RBLNTransformerEncoder(RBLNModel):
     rbln_dtype = "int64"

     @classmethod
-    def wrap_model_if_needed(cls, model: "PreTrainedModel", rbln_config: RBLNTransformerEncoderConfig) -> nn.Module:
+    def _wrap_model_if_needed(cls, model: "PreTrainedModel", rbln_config: RBLNTransformerEncoderConfig) -> nn.Module:
         class TransformerEncoderWrapper(nn.Module):
             # Parameters to disable for RBLN compilation
             DISABLED_PARAMS = {"return_dict", "use_cache"}
@@ -268,7 +268,7 @@ class RBLNModelForDepthEstimation(RBLNImageModel):
     auto_model_class = AutoModelForDepthEstimation

     @classmethod
-    def wrap_model_if_needed(cls, model: "PreTrainedModel", rbln_config: RBLNImageModelConfig):
+    def _wrap_model_if_needed(cls, model: "PreTrainedModel", rbln_config: RBLNImageModelConfig):
         class ImageModelWrapper(nn.Module):
             def __init__(self, model: "PreTrainedModel", rbln_config: RBLNImageModelConfig):
                 super().__init__()
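The two hunks above define their wrappers as local nn.Module classes inside the classmethod. A rough sketch of that inner-wrapper pattern follows; it is illustrative only, and the assumption that DISABLED_PARAMS are simply pinned to False before calling the wrapped model is not taken from the diff.

import torch
from torch import nn

# Illustrative only: the real TransformerEncoderWrapper in modeling_generic.py
# is more involved; this shows the idea of wrapping a model for compilation.
class EncoderWrapperSketch(nn.Module):
    DISABLED_PARAMS = {"return_dict", "use_cache"}  # kwargs disabled for RBLN compilation

    def __init__(self, model: nn.Module):
        super().__init__()
        self.model = model

    def forward(self, input_ids: torch.Tensor, attention_mask: torch.Tensor) -> torch.Tensor:
        # Forward plain tensors; flags the compiler cannot handle are forced off,
        # and the first element of the resulting tuple (hidden states) is returned.
        disabled = {name: False for name in self.DISABLED_PARAMS}
        return self.model(input_ids=input_ids, attention_mask=attention_mask, **disabled)[0]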

src/optimum/rbln/transformers/models/bart/modeling_bart.py

Lines changed: 1 addition & 1 deletion
@@ -48,7 +48,7 @@ class RBLNBartForConditionalGeneration(RBLNModelForSeq2SeqLM):
     support_causal_attn = True

     @classmethod
-    def wrap_model_if_needed(self, model: PreTrainedModel, rbln_config: RBLNBartForConditionalGenerationConfig):
+    def _wrap_model_if_needed(self, model: PreTrainedModel, rbln_config: RBLNBartForConditionalGenerationConfig):
         return BartWrapper(
             model, enc_max_seq_len=rbln_config.enc_max_seq_len, use_attention_mask=rbln_config.use_attention_mask
         )

src/optimum/rbln/transformers/models/bert/modeling_bert.py

Lines changed: 1 addition & 1 deletion
@@ -35,7 +35,7 @@ class RBLNBertModel(RBLNTransformerEncoderForFeatureExtraction):
     rbln_model_input_names = ["input_ids", "attention_mask"]

     @classmethod
-    def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNBertModelConfig) -> torch.nn.Module:
+    def _wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNBertModelConfig) -> torch.nn.Module:
         return BertModelWrapper(model, rbln_config)

0 commit comments