Commit dc500f0
1 Parent(s): 0806c70
Update llama.cpp support
Files changed:
- README.md (+4 -7)
- chat_template.jinja (+146 -0)
README.md
CHANGED
@@ -20,6 +20,7 @@ library_name: transformers
 <img src="assets/EXAONE_Symbol+BI_3d.png", width="300", style="margin: 40 auto;">
 🎉 License Updated! We are pleased to announce our more flexible licensing terms 🤗
 <br>✈️ Try on <a href="https://friendli.ai/suite/~/serverless-endpoints/LGAI-EXAONE/EXAONE-4.0-32B/overview">FriendliAI</a>
+<br><br><i>📢 EXAONE 4.0 is officially supported by llama.cpp! Please check the guide <a href="#quickstart-gguf">below</a></i>
 <br>
 
 # EXAONE-4.0-1.2B-GGUF
@@ -53,11 +54,7 @@ For more details, please refer to our [technical report](https://arxiv.org/abs/2
 ### llama.cpp
 You can run EXAONE models locally using llama.cpp by following these steps:
 
-1. Install the latest version of llama.cpp
-
-```bash
-git clone --single-branch -b add-exaone4 https://github.com/lgai-exaone/llama.cpp.git
-```
+1. Install the latest version of llama.cpp (version >= `b5932`). Please check the official [installation guide](https://github.com/ggml-org/llama.cpp?tab=readme-ov-file#quick-start) from llama.cpp.
 
 2. Download the EXAONE 4.0 model weights in GGUF format.
 
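The download step in the hunk above does not pin a method; here is a minimal sketch using `huggingface_hub` (the Q4_K_M filename is an assumption; pick the actual quantization from the repository's file list):

```python
from huggingface_hub import hf_hub_download

# Assumed filename; substitute the quantization you actually want.
gguf_path = hf_hub_download(
    repo_id="LGAI-EXAONE/EXAONE-4.0-1.2B-GGUF",
    filename="EXAONE-4.0-1.2B-Q4_K_M.gguf",
)
print(gguf_path)  # local cache path to pass to llama.cpp via -m
```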
@@ -108,12 +105,12 @@ git clone --single-branch -b add-exaone4 https://github.com/lgai-exaone/llama.cp
 <details>
 <summary>OpenAI compatible server with `llama-server`</summary>
 
-3. Run llama-server with EXAONE 4.0 Jinja template.
+3. Run llama-server with EXAONE 4.0 Jinja template. You can find the [chat template file](https://huggingface.co/LGAI-EXAONE/EXAONE-4.0-1.2B-GGUF/blob/main/chat_template.jinja) in this repository.
 ```bash
 llama-server -m EXAONE-4.0-32B-Q4_K_M.gguf \
     -c 131072 -fa -ngl 64 \
     --temp 0.6 --top-p 0.95 \
-    --jinja --chat-template-format
+    --jinja --chat-template-file chat_template.jinja \
     --host 0.0.0.0 --port 8820 \
     -a EXAONE-4.0-32B-Q4_K_M
 ```
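Once the server from the hunk above is running, it exposes llama.cpp's OpenAI-compatible `/v1/chat/completions` route. A minimal client sketch, assuming the server is reachable on `localhost:8820` with the alias set by `-a`, and that `requests` is installed:

```python
import requests

resp = requests.post(
    "http://localhost:8820/v1/chat/completions",
    json={
        "model": "EXAONE-4.0-32B-Q4_K_M",  # must match the -a alias
        "messages": [{"role": "user", "content": "Explain what GGUF is in one sentence."}],
        "temperature": 0.6,
        "top_p": 0.95,
    },
    timeout=300,
)
resp.raise_for_status()
print(resp.json()["choices"][0]["message"]["content"])
```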
chat_template.jinja
ADDED
@@ -0,0 +1,146 @@
+{%- if not skip_think is defined %}
+    {%- set skip_think = true %}
+{%- endif %}
+
+{%- set role_indicators = {
+    'user': '[|user|]\n',
+    'assistant': '[|assistant|]\n',
+    'system': '[|system|]\n',
+    'tool': '[|tool|]\n'
+} %}
+{%- set end_of_turn = '[|endofturn|]\n' %}
+
+
+{%- macro available_tools(tools) %}
+    {{- "# Available Tools" }}
+    {{- "\nYou can use none, one, or multiple of the following tools by calling them as functions to help with the user’s query." }}
+    {{- "\nHere are the tools available to you in JSON format within <tool> and </tool> tags:\n" }}
+    {%- for tool in tools %}
+        {{- "<tool>" }}
+        {{- tool | tojson(ensure_ascii=False) | safe }}
+        {{- "</tool>\n" }}
+    {%- endfor %}
+
+    {{- "\nFor each function call you want to make, return a JSON object with function name and arguments within <tool_call> and </tool_call> tags, like:" }}
+    {{- "\n<tool_call>{\"name\": function_1_name, \"arguments\": {argument_1_name: argument_1_value, argument_2_name: argument_2_value}}</tool_call>" }}
+    {{- "\n<tool_call>{\"name\": function_2_name, \"arguments\": {...}}</tool_call>\n..." }}
+    {{- "\nNote that if no argument name is specified for a tool, you can just print the argument value directly, without the argument name or JSON formatting." }}
+{%- endmacro %}
+
+
+{%- set ns = namespace(last_query_index = messages|length - 1) %}
+{%- for message in messages %}
+    {%- if message.role == "user" and message.content is string %}
+        {%- set ns.last_query_index = loop.index0 -%}
+    {%- endif %}
+{%- endfor %}
+
+{%- for i in range(messages | length) %}
+    {%- set msg = messages[i] %}
+    {%- set role = msg.role %}
+    {%- if role not in role_indicators %}
+        {{- raise_exception('Unknown role: ' ~ role) }}
+    {%- endif %}
+
+    {%- if i == 0 %}
+        {%- if role == 'system' %}
+            {{- role_indicators['system'] }}
+            {{- msg.content }}
+            {%- if tools is defined and tools %}
+                {{- "\n\n" }}{{- available_tools(tools) }}
+            {%- endif %}
+            {{- end_of_turn -}}
+            {%- continue %}
+        {%- elif tools is defined and tools %}
+            {{- role_indicators['system'] }}
+            {{- available_tools(tools) }}
+            {{- end_of_turn -}}
+        {%- endif %}
+    {%- endif %}
+
+    {%- if role == 'assistant' %}
+        {{- role_indicators['assistant'] }}
+
+        {%- if msg.content %}
+            {%- if "</think>" in msg.content %}
+                {%- set content = msg.content.split('</think>')[-1].strip() %}
+                {%- set reasoning_content = msg.content.split('</think>')[0].strip() %}
+                {%- if reasoning_content.startswith("<think>") %}
+                    {%- set reasoning_content = reasoning_content[7:].strip() %}
+                {%- endif %}
+            {%- else %}
+                {%- set content = msg.content %}
+            {%- endif %}
+
+            {%- if msg.reasoning_content %}
+                {%- set reasoning_content = msg.reasoning_content %}
+            {%- endif %}
+
+            {%- if (not skip_think and i > ns.last_query_index) and reasoning_content is defined %}
+                {{- "<think>\n" }}
+                {{- reasoning_content }}
+                {{- "\n</think>\n\n" }}
+            {%- else %}
+                {{- "<think>\n\n</think>\n\n" }}
+            {%- endif %}
+            {{- content }}
+        {%- endif %}
+
+        {%- if msg.tool_calls %}
+            {%- if msg.content %}
+                {{- "\n" }}
+            {%- else %}
+                {{- "<think>\n\n</think>\n\n" }}
+            {%- endif %}
+            {%- for tool_call in msg.tool_calls %}
+                {%- if tool_call.function is defined %}
+                    {%- set tool_call = tool_call.function %}
+                {%- endif %}
+
+                {%- if tool_call.arguments is defined %}
+                    {%- set arguments = tool_call.arguments %}
+                {%- elif tool_call.parameters is defined %}
+                    {%- set arguments = tool_call.parameters %}
+                {%- else %}
+                    {{- raise_exception('arguments or parameters are mandatory: ' ~ tool_call) }}
+                {%- endif %}
+
+                {{- "<tool_call>" }}{"name": "{{- tool_call.name }}", "arguments": {{ arguments | tojson(ensure_ascii=False) | safe }}}{{- "</tool_call>" }}
+
+                {%- if not loop.last %}
+                    {{- "\n" }}
+                {%- endif %}
+
+            {%- endfor %}
+        {%- endif %}
+        {{- end_of_turn -}}
+
+    {%- elif role == "tool" %}
+        {%- if i == 0 or messages[i - 1].role != "tool" %}
+            {{- role_indicators['tool'] }}
+        {%- endif %}
+        {%- if msg.content is defined %}
+            {{- "<tool_result>" }}{"result": {{ msg.content | tojson(ensure_ascii=False) | safe }}}{{- "</tool_result>" }}
+        {%- endif %}
+        {%- if loop.last or messages[i + 1].role != "tool" %}
+            {{- end_of_turn -}}
+        {%- else %}
+            {{- "\n" }}
+        {%- endif %}
+
+    {%- else %}
+        {{- role_indicators[role] }}
+        {{- msg.content }}
+        {{- end_of_turn -}}
+    {%- endif %}
+{% endfor %}
+
+
+{%- if add_generation_prompt %}
+    {{- role_indicators['assistant'] }}
+    {%- if enable_thinking is defined and enable_thinking is true %}
+        {{- "<think>\n" }}
+    {%- else %}
+        {{- "<think>\n\n</think>\n\n" }}
+    {%- endif %}
+{%- endif %}
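To sanity-check the prompt this template produces, it can be rendered outside llama.cpp with plain `jinja2`. A minimal sketch, assuming the added file above is saved (without the leading `+` diff markers) as `chat_template.jinja`; the `tojson` and `raise_exception` helpers are stand-ins for the ones HF transformers normally registers (stock jinja2's `tojson` filter does not take `ensure_ascii`), and the `loopcontrols` extension is required because the template uses `{%- continue %}`:

```python
import json
from jinja2 import Environment, FileSystemLoader

env = Environment(
    loader=FileSystemLoader("."),
    extensions=["jinja2.ext.loopcontrols"],  # the template uses {%- continue %}
)
# Stand-in for the transformers-style tojson filter (supports ensure_ascii).
env.filters["tojson"] = lambda value, ensure_ascii=True: json.dumps(
    value, ensure_ascii=ensure_ascii
)

def raise_exception(message):
    raise ValueError(message)

env.globals["raise_exception"] = raise_exception

template = env.get_template("chat_template.jinja")
print(template.render(
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Hello!"},
    ],
    add_generation_prompt=True,
    enable_thinking=False,  # non-reasoning mode: an empty <think> block is emitted
))
```

For tool calls, the template emits `<tool_call>{"name": ..., "arguments": {...}}</tool_call>` spans, so a client can recover them from a completion roughly as follows (the sample completion string is illustrative):

```python
import json
import re

sample = '<think>\n\n</think>\n\n<tool_call>{"name": "get_weather", "arguments": {"city": "Seoul"}}</tool_call>'
for payload in re.findall(r"<tool_call>(.*?)</tool_call>", sample, re.DOTALL):
    call = json.loads(payload)
    print(call["name"], call["arguments"])
```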