
Commit 58350b8

support Ouro

1 parent 4d37adf

15 files changed, with 450 additions and 18 deletions.

CMakeLists.txt: 1 addition & 0 deletions

```diff
@@ -106,6 +106,7 @@ set(core_files src/backend.cpp
 models/orpheus.cpp
 models/openchat.cpp
 models/orion.cpp
+models/ouro.cpp
 models/oute.cpp
 models/pangu.cpp
 models/phi.cpp
```

README.md: 1 addition & 0 deletions

```diff
@@ -33,6 +33,7 @@ LittleAcademia[<a href="https://github.com/foldl/little-academia" style="text-
 
 **What's New:**
 
+* 2025-11-03: Ouro
 * 2025-10-31: Megrez2-3x7B-A3B
 * 2025-10-25: LLaDA2.0-mini
 * 2025-10-14: Nanonets-OCR2
```

convert.py: 41 additions & 2 deletions

```diff
@@ -223,6 +223,8 @@ class ModelType(Enum):
 
     MegrezMoE = 0x2F00
 
+    OURO = 0x3000
+
     BCE_Embedding = 0x10000100
     BCE_ReRanker = 0x10000101
     BGE_M3 = 0x10000102
@@ -8175,6 +8177,41 @@ def get_weight_names(config):
 
     return weight_names
 
+class OuroConverter(BaseConverter):
+    MODEL_TYPE = ModelType.OURO
+
+    @classmethod
+    def pp(cls, config, name: str, tensor):
+        return Llama3Converter.pp(config, name, tensor)
+
+    @staticmethod
+    def dump_config(f, config, ggml_type):
+        assert config.rope_scaling is None
+        assert (config.layer_types.count('full_attention') == config.num_hidden_layers) or \
+               (config.use_sliding_window is None) or (not config.use_sliding_window)
+        assert not config.tie_word_embeddings is None
+
+        dump_llama_like_config(f, config, ggml_type)
+        config_values = [
+            config.num_key_value_heads,
+            config.rope_theta,
+        ]
+        f.write(struct.pack("<if", *config_values))
+
+    @staticmethod
+    def get_weight_names(config):
+        weight_names = Llama3Converter.get_weight_names(config)
+        for i in range(config.num_hidden_layers):
+            weight_names += [
+                f"model.layers.{i}.input_layernorm_2.weight",
+                f"model.layers.{i}.post_attention_layernorm_2.weight",
+            ]
+        weight_names += [
+            f"model.early_exit_gate.bias",
+            f"model.early_exit_gate.weight",
+        ]
+        return weight_names
+
 def convert_grok_1_base(args, vocab, ggml_type):
     def ffn_size(emb_size, widening_factor):
         _ffn_size = int(widening_factor * emb_size) * 2 // 3
@@ -8793,10 +8830,12 @@ def main():
     elif arch == 'MultiModalityCausalLM':
         assert JanusConverter.is_proper_config(config)
         JanusConverter.convert(config, model_files, vocab, ggml_type, args.save_path)
-    elif arch.endswith('DotsOCRForCausalLM'):
+    elif arch == 'DotsOCRForCausalLM':
         DotsOCRConverter.convert(config, model_files, vocab, ggml_type, args.save_path)
-    elif arch.endswith('MegrezMoeForCausalLM'):
+    elif arch == 'MegrezMoeForCausalLM':
         MegrezMoEConverter.convert(config, model_files, vocab, ggml_type, args.save_path)
+    elif arch == 'OuroForCausalLM':
+        OuroConverter.convert(config, model_files, vocab, ggml_type, args.save_path)
     elif arch == 'deepseek-r1-distill-qwen3':
         QWen3Converter.MODEL_TYPE = ModelType.DeepSeek_R1_Distill_QWen3
         QWen3Converter.convert(config, model_files, vocab, ggml_type, args.save_path)
```
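For context on the converter addition above: `OuroConverter.dump_config` writes the usual llama-like header via `dump_llama_like_config` and then appends exactly two extra fields with `struct.pack("<if", ...)`. Below is a minimal sketch of what that packing produces, with illustrative values only (the real ones come from the model's `config.json`):

```python
import struct

# Illustrative values only; the converter takes these from the model config.
num_key_value_heads = 8
rope_theta = 10000.0

blob = struct.pack("<if", num_key_value_heads, rope_theta)
print(len(blob))                   # 8 bytes: little-endian int32 followed by float32
print(struct.unpack("<if", blob))  # (8, 10000.0)
```

The corresponding loader (presumably `models/ouro.cpp`) would need to read these two fields, plus the extra per-layer `input_layernorm_2` / `post_attention_layernorm_2` weights and the `early_exit_gate` tensors, in the same order the converter emits them.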

docs/fun.md: 4 additions & 0 deletions

````diff
@@ -51,6 +51,10 @@ Before shuffling a model's layers, use `--show` to view basic information about
 ...
 ```
 
+> [!CAUTION]
+> Not all models support this. For example, an ordinary dense model like LLaMA does, but a heterogeneous model might
+> not (special treatment is needed to map a layer to its type).
+
 ## Talk to Each Other
 
 [Here](../scripts/crosstask.py) is a simple program to let two LLMs talk to each other.
````
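The caution added above comes down to whether every layer is interchangeable. Here is a minimal sketch of the kind of check a layer-shuffling tool would need, assuming a per-layer `layer_types` list like the one asserted on in the Ouro converter; the helper name and return convention are hypothetical:

```python
def can_shuffle_layers(layer_types: list[str]) -> bool:
    # Hypothetical helper: shuffling is only safe when all layers share a single
    # type, i.e. any layer can stand in for any other.
    return len(set(layer_types)) <= 1

# An ordinary dense model passes; a heterogeneous one does not.
print(can_shuffle_layers(['full_attention'] * 4))                    # True
print(can_shuffle_layers(['full_attention', 'sliding_window'] * 2))  # False
```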

docs/models.md: 7 additions & 0 deletions

```diff
@@ -228,6 +228,13 @@
     * [x] OLMoE: [Instruct-7B](https://huggingface.co/allenai/OLMoE-1B-7B-0924-Instruct)
     * [x] OLMo-2: [Instruct-7B](https://huggingface.co/allenai/OLMo-2-1124-7B-Instruct), [Instruct-13B](https://huggingface.co/allenai/OLMo-2-1124-13B-Instruct), [Instruct-32B](https://huggingface.co/allenai/OLMo-2-0325-32B-Instruct/tree/5942a2f5e0bc38c2a5f5200cec2ea236d5984547)
 
+* Ouro (`OuroForCausalLM`)
+    * [x] [2.6B-Thinking](https://huggingface.co/ByteDance/Ouro-2.6B-Thinking/tree/a2d3a54cea06168ba371ec3e089734f715824d5b)
+
+    Note: additional options supported (`--set ...`)
+    * `total_ut_steps`: default 4
+    * `exit_threshold`: default 1.0
+
 * Orion (`OrionForCausalLM`)
     * [x] [Chat-14B](https://huggingface.co/OrionStarAI/Orion-14B-Chat)
 
```
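A hedged example of overriding the two defaults listed above at run time. Only the `--set` option and the two keys come from the note in docs/models.md; the binary name, flags, model path, and key/value syntax are assumptions that may differ in your build:

```python
import subprocess

# Hypothetical invocation: binary name, model path, and the --set key/value form
# are assumptions; consult your build's --help for the exact syntax.
subprocess.run([
    "./build/bin/main", "-m", "ouro-2.6b-thinking.bin",
    "--set", "total_ut_steps", "4",
    "--set", "exit_threshold", "1.0",
    "-i",
])
```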
