
Commit 764c976

mudler authored and github-actions[bot] committed
chore(model gallery): 🤖 add new models via gallery agent
Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
1 parent c03e532 commit 764c976

File tree

1 file changed: +25 −0 lines


gallery/index.yaml

Lines changed: 25 additions & 0 deletions
@@ -1,4 +1,29 @@
 ---
+- name: "thinkfl-llama3-8b"
+  url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
+  urls:
+    - https://huggingface.co/mradermacher/ThinkFL-Llama3-8B-GGUF
+  description: |
+    The model is a quantized version of the official Llama3-8B model, packaged in the GGUF format for efficiency. It retains the core capabilities of the original model while being reduced in precision (e.g., Q4_K_S, Q2_K, Q8_0) to lower computational demands. The quantization reduces memory usage and speeds up inference without materially sacrificing output quality, making the model suitable for deployment in resource-constrained environments.
+  overrides:
+    parameters:
+      model: llama-cpp/models/ThinkFL-Llama3-8B.Q4_K_M.gguf
+    name: ThinkFL-Llama3-8B-GGUF
+    backend: llama-cpp
+    template:
+      use_tokenizer_template: true
+    known_usecases:
+      - chat
+    function:
+      grammar:
+        disable: true
+    description: Imported from https://huggingface.co/mradermacher/ThinkFL-Llama3-8B-GGUF
+    options:
+      - use_jinja:true
+  files:
+    - filename: llama-cpp/models/ThinkFL-Llama3-8B.Q4_K_M.gguf
+      sha256: f83a572952eb838c0d38791e53a8b16ac8bb3786560e2f99299f396f130de8eb
+      uri: https://huggingface.co/mradermacher/ThinkFL-Llama3-8B-GGUF/resolve/main/ThinkFL-Llama3-8B.Q4_K_M.gguf
 - name: "lfm2.5-1.2b-nova-function-calling"
   url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
   urls:
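The `sha256` field in the entry lets a gallery client verify the downloaded GGUF file before handing it to the backend. A minimal sketch of that check in Python (the helper name and chunk size are illustrative assumptions, not LocalAI's actual implementation):

```python
import hashlib

def sha256_of_file(path: str, chunk_size: int = 1 << 20) -> str:
    """Stream a file through SHA-256 so a multi-GB GGUF never loads fully into memory."""
    h = hashlib.sha256()
    with open(path, "rb") as f:
        while chunk := f.read(chunk_size):
            h.update(chunk)
    return h.hexdigest()

# Expected digest taken from the gallery entry above.
EXPECTED = "f83a572952eb838c0d38791e53a8b16ac8bb3786560e2f99299f396f130de8eb"

# Hypothetical usage against the path the entry declares:
# if sha256_of_file("llama-cpp/models/ThinkFL-Llama3-8B.Q4_K_M.gguf") != EXPECTED:
#     raise ValueError("checksum mismatch: re-download the model file")
```

Streaming in chunks matters here because Q4_K_M weights for an 8B model are several gigabytes.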

0 commit comments

Comments
 (0)
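Since the entry lists `chat` under `known_usecases`, the installed model is addressed by its gallery name through LocalAI's OpenAI-compatible chat endpoint. A hedged sketch of building such a request body (the helper is hypothetical; only the model name comes from the entry above, and the server URL would be your LocalAI instance's):

```python
import json

def build_chat_request(prompt: str, model: str = "thinkfl-llama3-8b") -> str:
    """Build an OpenAI-style chat-completion body, serialized as JSON,
    suitable for POSTing to a LocalAI /v1/chat/completions endpoint."""
    body = {
        "model": model,
        "messages": [{"role": "user", "content": prompt}],
    }
    return json.dumps(body)

payload = build_chat_request("Summarize the GGUF format in one sentence.")
```

Because the entry sets `use_tokenizer_template: true` and `use_jinja:true`, the server applies the model's own chat template to these messages rather than a hand-written prompt format.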