Jana0511 committed on
Commit
091b3ee
1 Parent(s): 99748ae

Upload tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +2 -2
  2. vocab.json +13 -15
added_tokens.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "</s>": 46,
3
- "<s>": 45
4
  }
 
1
  {
2
+ "</s>": 44,
3
+ "<s>": 43
4
  }
vocab.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "[PAD]": 44,
3
- "[UNK]": 43,
4
  "a": 1,
5
  "b": 2,
6
  "c": 3,
@@ -31,17 +31,15 @@
31
  "¬": 27,
32
  "à": 28,
33
  "á": 29,
34
- "â": 30,
35
- "ä": 31,
36
- "é": 32,
37
- "ë": 33,
38
- "ï": 34,
39
- "ñ": 35,
40
- "ò": 36,
41
- "ö": 37,
42
- "û": 38,
43
- "ÿ": 39,
44
- "ŵ": 40,
45
- "–": 41,
46
- "—": 42
47
  }
 
1
  {
2
+ "[PAD]": 42,
3
+ "[UNK]": 41,
4
  "a": 1,
5
  "b": 2,
6
  "c": 3,
 
31
  "¬": 27,
32
  "à": 28,
33
  "á": 29,
34
+ "ä": 30,
35
+ "é": 31,
36
+ "ë": 32,
37
+ "ï": 33,
38
+ "ñ": 34,
39
+ "ò": 35,
40
+ "ö": 36,
41
+ "û": 37,
42
+ "ÿ": 38,
43
+ "": 39,
44
+ "": 40
 
 
45
  }