Updated Templates supported by llama_chat_apply_template (markdown)

Xuan Son Nguyen 2024-03-14 22:11:36 +01:00
parent c0eb5b983a
commit 420b3fdda3

@@ -19,6 +19,7 @@ VARIANTS_TO_TEST = [
    'bofenghuang/vigogne-2-70b-chat',
    'mlabonne/AlphaMonarch-7B',
    'google/gemma-7b-it',
    'OrionStarAI/Orion-14B-Chat',
]
HISTORY = [
@@ -34,7 +35,7 @@ for variant in VARIANTS_TO_TEST:
    if 'Mistral' in variant or 'gemma' in variant:
        history.pop(0) # no system prompt for mistral and gemma
    if 'gemma' in variant:
        # GemmaTokenizer is not yet supported at the time this code is written
        # GemmaTokenizer is quite buggy, let's hard-code the template here
        GEMMA_TMLP = "{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}"
        print('Gemma')
        output = AutoTokenizer.from_pretrained(VARIANTS_TO_TEST[0]).apply_chat_template(history, tokenize=False, chat_template=GEMMA_TMLP)
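For reference, rendering the test history through this hard-coded template should produce output shaped like the following. This is a sketch derived by hand from the template string above (assistant turns are renamed to `model`, content is trimmed, and no generation prompt is appended since `add_generation_prompt` defaults to false); the turn contents are inferred from the output samples shown further down, not captured from a run:
```
<start_of_turn>user
hello<end_of_turn>
<start_of_turn>model
response<end_of_turn>
<start_of_turn>user
again<end_of_turn>
<start_of_turn>model
response<end_of_turn>
```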
@@ -131,6 +132,15 @@ again<|endoftext|>
response<|endoftext|>
```
```
Usage: ./server -m ... --chat-template orion
<s>Human: hello
Assistant: </s>response</s>Human: again
Assistant: </s>response</s>
```
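Once the server is started with a built-in template like this, the template is applied server-side by the OpenAI-compatible endpoint. A minimal sketch of exercising it (the host, port, and message are assumptions, not part of the test script):
```
# Sketch: ask a llama.cpp server (started with --chat-template orion)
# for a chat completion; the server renders the Orion template itself.
import requests

res = requests.post(
    'http://localhost:8080/v1/chat/completions',  # assumed default host/port
    json={'messages': [{'role': 'user', 'content': 'hello'}]},
)
print(res.json()['choices'][0]['message']['content'])
```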
## Custom chat templates
Currently, it's not possible to use your own chat template with the llama.cpp server's `/chat/completions` endpoint.
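One possible workaround is to render a custom template client-side and send the resulting string to the server's raw completion endpoint instead, bypassing server-side chat templating. A sketch of that idea, reusing `transformers` as in the test script above; the custom template, model name, and endpoint details here are assumptions for illustration:
```
# Workaround sketch: apply a hypothetical custom Jinja template client-side,
# then post the rendered prompt to the server's plain /completion endpoint.
import requests
from transformers import AutoTokenizer

# Hypothetical custom template, for illustration only
CUSTOM_TMPL = (
    "{% for message in messages %}"
    "{{ message['role'] + ': ' + message['content'] + '\n' }}"
    "{% endfor %}assistant: "
)

tokenizer = AutoTokenizer.from_pretrained('mlabonne/AlphaMonarch-7B')
prompt = tokenizer.apply_chat_template(
    [{'role': 'user', 'content': 'hello'}],
    tokenize=False,
    chat_template=CUSTOM_TMPL,  # your own template, never sent to the server
)
res = requests.post('http://localhost:8080/completion',  # assumed host/port
                    json={'prompt': prompt, 'n_predict': 64})
print(res.json()['content'])
```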