chore(model gallery): add ai21labs_ai21-jamba-reasoning-3b

mudler · mudler · commit 06f20fe40016 · 2025-10-09T12:57:27.000+02:00
Signed-off-by: Ettore Di Giacinto &lt;mudler@localai.io&gt;
diff --git a/gallery/index.yaml b/gallery/index.yaml
@@ -1,4 +1,29 @@
 ---
+- &jamba
+  icon: https://cdn-avatars.huggingface.co/v1/production/uploads/65e60c0ed5313c06372446ff/QwehUHgP2HtVAMW5MzJ2j.png
+  name: "ai21labs_ai21-jamba-reasoning-3b"
+  url: "github:mudler/LocalAI/gallery/jamba.yaml@master"
+  license: apache-2.0
+  tags:
+    - gguf
+    - GPU
+    - CPU
+    - text-to-text
+    - jamba
+    - mamba
+  urls:
+    - https://huggingface.co/ai21labs/AI21-Jamba-Reasoning-3B
+    - https://huggingface.co/bartowski/ai21labs_AI21-Jamba-Reasoning-3B-GGUF
+  description: |
+      AI21’s Jamba Reasoning 3B is a top-performing reasoning model that packs leading scores on intelligence benchmarks and highly-efficient processing into a compact 3B build.
+      The hybrid design combines Transformer attention with Mamba (a state-space model). Mamba layers are more efficient for sequence processing, while attention layers capture complex dependencies. This mix reduces memory overhead, improves throughput, and makes the model run smoothly on laptops, GPUs, and even mobile devices, while maintainig impressive quality.
+  overrides:
+    parameters:
+      model: ai21labs_AI21-Jamba-Reasoning-3B-Q4_K_M.gguf
+  files:
+    - filename: ai21labs_AI21-Jamba-Reasoning-3B-Q4_K_M.gguf
+      sha256: ac7ec0648dea62d1efb5ef6e7268c748ffc71f1c26eebe97eccff0a8d41608e6
+      uri: huggingface://bartowski/ai21labs_AI21-Jamba-Reasoning-3B-GGUF/ai21labs_AI21-Jamba-Reasoning-3B-Q4_K_M.gguf
 - &granite4
   url: "github:mudler/LocalAI/gallery/granite4.yaml@master"
   name: "ibm-granite_granite-4.0-h-small"
diff --git a/gallery/jamba.yaml b/gallery/jamba.yaml
@@ -0,0 +1,49 @@
+---
+name: "jamba"
+
+config_file: |
+  mmap: true
+  backend: "llama-cpp"
+  template:
+    chat_message: |
+      <|im_start|>{{if eq .RoleName "tool" }}user{{else}}{{ .RoleName }}{{end}}
+      {{ if eq .RoleName "tool" -}}
+      <tool_response>
+      {{ end -}}
+      {{ if .Content -}}
+      {{.Content }}
+      {{ end -}}
+      {{ if eq .RoleName "tool" -}}
+      </tool_response>
+      {{ end -}}
+      {{ if .FunctionCall -}}
+      <tool_call>
+      {{toJson .FunctionCall}}
+      </tool_call>
+      {{ end -}}<|im_end|>
+    function: |
+      <|im_start|>system
+      # Tools
+      You may call one or more functions to assist with the user query.
+      You are provided with function signatures within <tools></tools> XML tags:
+      <tools>
+      {{range .Functions}}
+      {'type': 'function', 'function': {'name': '{{.Name}}', 'description': '{{.Description}}', 'parameters': {{toJson .Parameters}} }}
+      {{end}}
+      </tools>
+      <|im_end|>
+      {{.Input -}}
+      <|im_start|>assistant
+    chat: |
+      {{.Input -}}
+      <|im_start|>assistant
+      <think>
+    completion: |
+      {{.Input}}
+  context_size: 8192
+  f16: true
+  stopwords:
+  - '<|im_end|>'
+  - '<dummy32000>'
+  - '</s>'
+  - '<|endoftext|>'