Replace chat template and correct generation eos_token_id
Browse files
- chat_template.jinja +15 -89
- generation_config.json +2 -3
chat_template.jinja
CHANGED
|
@@ -1,93 +1,19 @@
|
|
| 1 |
-
{
|
| 2 |
-
{%- if custom_tools is defined %}
|
| 3 |
-
{%- set tools = custom_tools %}
|
| 4 |
-
{%- endif %}
|
| 5 |
-
{%- if not tools_in_user_message is defined %}
|
| 6 |
-
{%- set tools_in_user_message = true %}
|
| 7 |
-
{%- endif %}
|
| 8 |
-
{%- if not date_string is defined %}
|
| 9 |
-
{%- if strftime_now is defined %}
|
| 10 |
-
{%- set date_string = strftime_now("%d %b %Y") %}
|
| 11 |
-
{%- else %}
|
| 12 |
-
{%- set date_string = "26 Jul 2024" %}
|
| 13 |
-
{%- endif %}
|
| 14 |
-
{%- endif %}
|
| 15 |
-
{%- if not tools is defined %}
|
| 16 |
-
{%- set tools = none %}
|
| 17 |
-
{%- endif %}
|
| 18 |
|
| 19 |
-
{
|
| 20 |
-
{%- if messages[0]['role'] == 'system' %}
|
| 21 |
-
{%- set system_message = messages[0]['content']|trim %}
|
| 22 |
-
{%- set messages = messages[1:] %}
|
| 23 |
-
{%- else %}
|
| 24 |
-
{%- set system_message = "" %}
|
| 25 |
-
{%- endif %}
|
| 26 |
|
| 27 |
-
{
|
| 28 |
-
{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
|
| 29 |
-
{%- if tools is not none %}
|
| 30 |
-
{{- "Environment: ipython\n" }}
|
| 31 |
-
{%- endif %}
|
| 32 |
-
{{- "Cutting Knowledge Date: December 2023\n" }}
|
| 33 |
-
{{- "Today Date: " + date_string + "\n\n" }}
|
| 34 |
-
{%- if tools is not none and not tools_in_user_message %}
|
| 35 |
-
{{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
|
| 36 |
-
{{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
|
| 37 |
-
{{- "Do not use variables.\n\n" }}
|
| 38 |
-
{%- for t in tools %}
|
| 39 |
-
{{- t | tojson(indent=4) }}
|
| 40 |
-
{{- "\n\n" }}
|
| 41 |
-
{%- endfor %}
|
| 42 |
-
{%- endif %}
|
| 43 |
-
{{- system_message }}
|
| 44 |
-
{{- "<|eot_id|>" }}
|
| 45 |
|
| 46 |
-
{
|
| 47 |
-
{%- if tools_in_user_message and not tools is none %}
|
| 48 |
-
{#- Extract the first user message so we can plug it in here #}
|
| 49 |
-
{%- if messages | length != 0 %}
|
| 50 |
-
{%- set first_user_message = messages[0]['content']|trim %}
|
| 51 |
-
{%- set messages = messages[1:] %}
|
| 52 |
-
{%- else %}
|
| 53 |
-
{{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
|
| 54 |
-
{%- endif %}
|
| 55 |
-
{{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
|
| 56 |
-
{{- "Given the following functions, please respond with a JSON for a function call " }}
|
| 57 |
-
{{- "with its proper arguments that best answers the given prompt.\n\n" }}
|
| 58 |
-
{{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
|
| 59 |
-
{{- "Do not use variables.\n\n" }}
|
| 60 |
-
{%- for t in tools %}
|
| 61 |
-
{{- t | tojson(indent=4) }}
|
| 62 |
-
{{- "\n\n" }}
|
| 63 |
-
{%- endfor %}
|
| 64 |
-
{{- first_user_message + "<|eot_id|>"}}
|
| 65 |
-
{%- endif %}
|
| 66 |
|
| 67 |
-
{%- for message in messages
|
| 68 |
-
{%-
|
| 69 |
-
{{-
|
| 70 |
-
{%- elif '
|
| 71 |
-
{
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
|
| 76 |
-
|
| 77 |
-
|
| 78 |
-
{{- tool_call.arguments | tojson }}
|
| 79 |
-
{{- "}" }}
|
| 80 |
-
{{- "<|eot_id|>" }}
|
| 81 |
-
{%- elif message.role == "tool" or message.role == "ipython" %}
|
| 82 |
-
{{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
|
| 83 |
-
{%- if message.content is mapping or message.content is iterable %}
|
| 84 |
-
{{- message.content | tojson }}
|
| 85 |
-
{%- else %}
|
| 86 |
-
{{- message.content }}
|
| 87 |
-
{%- endif %}
|
| 88 |
-
{{- "<|eot_id|>" }}
|
| 89 |
-
{%- endif %}
|
| 90 |
-
{%- endfor %}
|
| 91 |
-
{%- if add_generation_prompt %}
|
| 92 |
-
{{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
|
| 93 |
-
{%- endif %}
|
|
|
|
| 1 |
+
{%- set begin_transcript = "<custom_token_3><|begin_of_text|>" -%}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
|
| 3 |
+
{%- set end_transcript = "<|eot_id|><custom_token_4>" -%}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
|
| 5 |
+
{%- set begin_audio = "<custom_token_5><custom_token_1>" -%}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
|
| 7 |
+
{%- set end_audio = "<custom_token_2><custom_token_6>" -%}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8 |
|
| 9 |
+
{%- for message in messages -%}
|
| 10 |
+
{%- if message.role == 'user' -%}
|
| 11 |
+
{{- begin_transcript + message['content'] | trim + end_transcript -}}
|
| 12 |
+
{%- elif message.role == 'assistant' -%}
|
| 13 |
+
{{- begin_audio + message['content'] | trim + end_audio -}}
|
| 14 |
+
{%- endif -%}
|
| 15 |
+
{%- endfor -%}
|
| 16 |
+
|
| 17 |
+
{%- if add_generation_prompt -%}
|
| 18 |
+
{{- begin_audio -}}
|
| 19 |
+
{%- endif -%}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
generation_config.json
CHANGED
|
@@ -2,8 +2,7 @@
|
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 128000,
|
| 4 |
"do_sample": true,
|
| 5 |
-
"eos_token_id":
|
| 6 |
-
"temperature": 0.
|
| 7 |
-
"top_p": 0.9,
|
| 8 |
"transformers_version": "4.52.4"
|
| 9 |
}
|
|
|
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 128000,
|
| 4 |
"do_sample": true,
|
| 5 |
+
"eos_token_id": 128258,
|
| 6 |
+
"temperature": 0.7,
|
|
|
|
| 7 |
"transformers_version": "4.52.4"
|
| 8 |
}
|