Add additional_special_tokens to the tokenizer config
Browse files
- tokenizer_config.json +8 -0
tokenizer_config.json
CHANGED
@@ -86,5 +86,13 @@
|
|
86 |
"special": true
|
87 |
}
|
88 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
89 |
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
90 |
}
|
|
|
86 |
"special": true
|
87 |
}
|
88 |
},
|
89 |
+
"additional_special_tokens": [
|
90 |
+
"<|im_start|>",
|
91 |
+
"<|im_end|>",
|
92 |
+
"<|action_start|>",
|
93 |
+
"<|action_end|>",
|
94 |
+
"<|interpreter|>",
|
95 |
+
"<|plugin|>"
|
96 |
+
],
|
97 |
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
98 |
}
|