depasquale committed on
Commit
7eb9ade
1 Parent(s): 56b6dfd

Fix EOS token

Browse files

I think this will fix the issue below. I'm unsure whether `pad_token` also needs to be changed.

https://github.com/huggingface/swift-transformers/issues/98

Files changed (1) hide show
  1. tokenizer_config.json +1 -1
tokenizer_config.json CHANGED
@@ -118,7 +118,7 @@
118
  "bos_token": "<s>",
119
  "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') %}{{'<|user|>' + '\n' + message['content'] + '<|end|>' + '\n' + '<|assistant|>' + '\n'}}{% elif (message['role'] == 'assistant') %}{{message['content'] + '<|end|>' + '\n'}}{% endif %}{% endfor %}",
120
  "clean_up_tokenization_spaces": false,
121
- "eos_token": "<|endoftext|>",
122
  "legacy": false,
123
  "model_max_length": 4096,
124
  "pad_token": "<|endoftext|>",
 
118
  "bos_token": "<s>",
119
  "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') %}{{'<|user|>' + '\n' + message['content'] + '<|end|>' + '\n' + '<|assistant|>' + '\n'}}{% elif (message['role'] == 'assistant') %}{{message['content'] + '<|end|>' + '\n'}}{% endif %}{% endfor %}",
120
  "clean_up_tokenization_spaces": false,
121
+ "eos_token": "<|end|>",
122
  "legacy": false,
123
  "model_max_length": 4096,
124
  "pad_token": "<|endoftext|>",