msharma95 Raj-Sanjay-Shah committed on
Commit
8c146bb
1 Parent(s): c289364

Update tokenizer_config.json (#5)

Browse files

- Update tokenizer_config.json (6086e7b7051c9a15b5d1e8436e34de2a6e4b1277)


Co-authored-by: Raj Sanjay Shah <Raj-Sanjay-Shah@users.noreply.huggingface.co>

Files changed (1) hide show
  1. tokenizer_config.json +2 -9
tokenizer_config.json CHANGED
@@ -43,21 +43,14 @@
43
  "special": true
44
  }
45
  },
46
- "bos_token": {
47
- "content": "<s>",
48
- "single_word": false,
49
- "lstrip": false,
50
- "rstrip": false,
51
- "normalized": true,
52
- "__type": "AddedToken"
53
- },
54
  "clean_up_tokenization_spaces": true,
55
  "cls_token": "<s>",
56
  "eos_token": "</s>",
57
  "errors": "replace",
58
  "mask_token": "<mask>",
59
  "max_length": 128,
60
- "model_max_length": 1e+30,
61
  "pad_to_multiple_of": null,
62
  "pad_token": "<pad>",
63
  "pad_token_type_id": 0,
 
43
  "special": true
44
  }
45
  },
46
+ "bos_token": "<s>",
 
 
 
 
 
 
 
47
  "clean_up_tokenization_spaces": true,
48
  "cls_token": "<s>",
49
  "eos_token": "</s>",
50
  "errors": "replace",
51
  "mask_token": "<mask>",
52
  "max_length": 128,
53
+ "model_max_length":1e+30,
54
  "pad_to_multiple_of": null,
55
  "pad_token": "<pad>",
56
  "pad_token_type_id": 0,