Scaling-Laws-for-Local-SGD-in-LLM-Intermediate-Checkpoints/base/base_0.012b/tokenizer_config.json
{
  "add_bos_token": false,
  "add_eos_token": false,
  "bos_token": {
    "__type": "AddedToken",
    "content": "<|begin▁of▁sentence|>",
    "lstrip": false,
    "normalized": true,
    "rstrip": false,
    "single_word": false
  },
  "clean_up_tokenization_spaces": false,
  "eos_token": {
    "__type": "AddedToken",
    "content": "<|end▁of▁sentence|>",
    "lstrip": false,
    "normalized": true,
    "rstrip": false,
    "single_word": false
  },
  "legacy": true,
  "model_max_length": 4096,
  "pad_token": {
    "__type": "AddedToken",
    "content": "<|end▁of▁sentence|>",
    "lstrip": false,
    "normalized": true,
    "rstrip": false,
    "single_word": false
  },
  "sp_model_kwargs": {},
  "unk_token": null,
  "tokenizer_class": "LlamaTokenizerFast"
}