doubledsbv committed on
Commit
a737d48
1 Parent(s): fc7ea43

Upload tokenizer

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. special_tokens_map.json +1 -7
  3. tokenizer.json +0 -27
  4. tokenizer_config.json +1 -1
README.md CHANGED
@@ -1,15 +1,15 @@
1
  ---
 
 
 
2
  library_name: transformers
3
  tags:
4
  - deutsch
5
  - german
6
  - seedbox
7
  - mistral
8
- license: apache-2.0
9
  datasets:
10
  - seedboxai/multitask_german_examples_32k
11
- language:
12
- - de
13
  pipeline_tag: text-generation
14
  ---
15
 
 
1
  ---
2
+ language:
3
+ - de
4
+ license: apache-2.0
5
  library_name: transformers
6
  tags:
7
  - deutsch
8
  - german
9
  - seedbox
10
  - mistral
 
11
  datasets:
12
  - seedboxai/multitask_german_examples_32k
 
 
13
  pipeline_tag: text-generation
14
  ---
15
 
special_tokens_map.json CHANGED
@@ -18,13 +18,7 @@
18
  "rstrip": false,
19
  "single_word": false
20
  },
21
- "pad_token": {
22
- "content": "<unk>",
23
- "lstrip": false,
24
- "normalized": false,
25
- "rstrip": false,
26
- "single_word": false
27
- },
28
  "unk_token": {
29
  "content": "<unk>",
30
  "lstrip": false,
 
18
  "rstrip": false,
19
  "single_word": false
20
  },
21
+ "pad_token": "<unk>",
 
 
 
 
 
 
22
  "unk_token": {
23
  "content": "<unk>",
24
  "lstrip": false,
tokenizer.json CHANGED
@@ -67,12 +67,6 @@
67
  "id": "A",
68
  "type_id": 0
69
  }
70
- },
71
- {
72
- "SpecialToken": {
73
- "id": "</s>",
74
- "type_id": 0
75
- }
76
  }
77
  ],
78
  "pair": [
@@ -88,12 +82,6 @@
88
  "type_id": 0
89
  }
90
  },
91
- {
92
- "SpecialToken": {
93
- "id": "</s>",
94
- "type_id": 0
95
- }
96
- },
97
  {
98
  "SpecialToken": {
99
  "id": "<s>",
@@ -105,24 +93,9 @@
105
  "id": "B",
106
  "type_id": 1
107
  }
108
- },
109
- {
110
- "SpecialToken": {
111
- "id": "</s>",
112
- "type_id": 1
113
- }
114
  }
115
  ],
116
  "special_tokens": {
117
- "</s>": {
118
- "id": "</s>",
119
- "ids": [
120
- 2
121
- ],
122
- "tokens": [
123
- "</s>"
124
- ]
125
- },
126
  "<s>": {
127
  "id": "<s>",
128
  "ids": [
 
67
  "id": "A",
68
  "type_id": 0
69
  }
 
 
 
 
 
 
70
  }
71
  ],
72
  "pair": [
 
82
  "type_id": 0
83
  }
84
  },
 
 
 
 
 
 
85
  {
86
  "SpecialToken": {
87
  "id": "<s>",
 
93
  "id": "B",
94
  "type_id": 1
95
  }
 
 
 
 
 
 
96
  }
97
  ],
98
  "special_tokens": {
 
 
 
 
 
 
 
 
 
99
  "<s>": {
100
  "id": "<s>",
101
  "ids": [
tokenizer_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "add_bos_token": true,
3
- "add_eos_token": true,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
1
  {
2
  "add_bos_token": true,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",