dougtrajano commited on
Commit
f3a8e1e
1 Parent(s): 024565b

Model save

Browse files
last-checkpoint/config.json DELETED
@@ -1,40 +0,0 @@
1
- {
2
- "_name_or_path": "neuralmind/bert-base-portuguese-cased",
3
- "architectures": [
4
- "ToxicityTypeForSequenceClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "directionality": "bidi",
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
- "id2label": {
13
- "0": "NOT-OFFENSIVE",
14
- "1": "OFFENSIVE"
15
- },
16
- "initializer_range": 0.02,
17
- "intermediate_size": 3072,
18
- "label2id": {
19
- "NOT-OFFENSIVE": 0,
20
- "OFFENSIVE": 1
21
- },
22
- "layer_norm_eps": 1e-12,
23
- "max_position_embeddings": 512,
24
- "model_type": "bert",
25
- "num_attention_heads": 12,
26
- "num_hidden_layers": 12,
27
- "output_past": true,
28
- "pad_token_id": 0,
29
- "pooler_fc_size": 768,
30
- "pooler_num_attention_heads": 12,
31
- "pooler_num_fc_layers": 3,
32
- "pooler_size_per_head": 128,
33
- "pooler_type": "first_token_transform",
34
- "position_embedding_type": "absolute",
35
- "torch_dtype": "float32",
36
- "transformers_version": "4.26.0",
37
- "type_vocab_size": 2,
38
- "use_cache": true,
39
- "vocab_size": 29794
40
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3abd9e432cd17aa227c77a4602995a7d44a2d5b8db7d09756643847c4bdb3b4a
3
- size 871513885
 
 
 
 
last-checkpoint/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea0028124c16c42b0173d84c15dfc6aaf99389e964846d869e1df752e59e8dec
3
- size 435769709
 
 
 
 
last-checkpoint/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:69726e2727b419acf15202f62187cf0581b6c2bfd7c023bc96716f05fa3e0d08
3
- size 14503
 
 
 
 
last-checkpoint/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c784665c0bd4de01cbb7e9c50f86d2b0ebff72eead0e3ffd23f231c6475b92bf
3
- size 623
 
 
 
 
last-checkpoint/special_tokens_map.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
7
- }
 
 
 
 
 
 
 
 
last-checkpoint/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/tokenizer_config.json DELETED
@@ -1,16 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "do_basic_tokenize": true,
4
- "do_lower_case": false,
5
- "mask_token": "[MASK]",
6
- "model_max_length": 1000000000000000019884624838656,
7
- "name_or_path": "neuralmind/bert-base-portuguese-cased",
8
- "never_split": null,
9
- "pad_token": "[PAD]",
10
- "sep_token": "[SEP]",
11
- "special_tokens_map_file": "/root/.cache/huggingface/hub/models--neuralmind--bert-base-portuguese-cased/snapshots/94d69c95f98f7d5b2a8700c420230ae10def0baa/special_tokens_map.json",
12
- "strip_accents": null,
13
- "tokenize_chinese_chars": true,
14
- "tokenizer_class": "BertTokenizer",
15
- "unk_token": "[UNK]"
16
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/trainer_state.json DELETED
@@ -1,274 +0,0 @@
1
- {
2
- "best_metric": 0.8580479726153486,
3
- "best_model_checkpoint": "./output/toxic-comment-classification-2023-02-12-03-38-39-438/model/checkpoint-5632",
4
- "epoch": 9.0,
5
- "global_step": 12672,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.36,
12
- "learning_rate": 3.217249581414747e-05,
13
- "loss": 0.4962,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 0.71,
18
- "learning_rate": 3.1787104153700095e-05,
19
- "loss": 0.4422,
20
- "step": 1000
21
- },
22
- {
23
- "epoch": 1.0,
24
- "eval_accuracy": 0.8465608465608465,
25
- "eval_f1": 0.846971473226303,
26
- "eval_loss": 0.4196861684322357,
27
- "eval_precision": 0.8505491368402285,
28
- "eval_recall": 0.8465608465608465,
29
- "eval_runtime": 14.7315,
30
- "eval_samples_per_second": 218.104,
31
- "eval_steps_per_second": 27.288,
32
- "step": 1408
33
- },
34
- {
35
- "epoch": 1.07,
36
- "learning_rate": 3.140171249325271e-05,
37
- "loss": 0.424,
38
- "step": 1500
39
- },
40
- {
41
- "epoch": 1.42,
42
- "learning_rate": 3.1016320832805326e-05,
43
- "loss": 0.3631,
44
- "step": 2000
45
- },
46
- {
47
- "epoch": 1.78,
48
- "learning_rate": 3.063092917235795e-05,
49
- "loss": 0.3566,
50
- "step": 2500
51
- },
52
- {
53
- "epoch": 2.0,
54
- "eval_accuracy": 0.8412698412698413,
55
- "eval_f1": 0.8394018830559876,
56
- "eval_loss": 0.47242870926856995,
57
- "eval_precision": 0.8453384370339388,
58
- "eval_recall": 0.8412698412698413,
59
- "eval_runtime": 15.5699,
60
- "eval_samples_per_second": 206.359,
61
- "eval_steps_per_second": 25.819,
62
- "step": 2816
63
- },
64
- {
65
- "epoch": 2.13,
66
- "learning_rate": 3.0245537511910564e-05,
67
- "loss": 0.3359,
68
- "step": 3000
69
- },
70
- {
71
- "epoch": 2.49,
72
- "learning_rate": 2.986014585146318e-05,
73
- "loss": 0.3024,
74
- "step": 3500
75
- },
76
- {
77
- "epoch": 2.84,
78
- "learning_rate": 2.9474754191015798e-05,
79
- "loss": 0.3135,
80
- "step": 4000
81
- },
82
- {
83
- "epoch": 3.0,
84
- "eval_accuracy": 0.844693432928727,
85
- "eval_f1": 0.8433530690879544,
86
- "eval_loss": 0.48013588786125183,
87
- "eval_precision": 0.8469664276626117,
88
- "eval_recall": 0.844693432928727,
89
- "eval_runtime": 15.5293,
90
- "eval_samples_per_second": 206.899,
91
- "eval_steps_per_second": 25.887,
92
- "step": 4224
93
- },
94
- {
95
- "epoch": 3.2,
96
- "learning_rate": 2.9089362530568417e-05,
97
- "loss": 0.2789,
98
- "step": 4500
99
- },
100
- {
101
- "epoch": 3.55,
102
- "learning_rate": 2.8703970870121032e-05,
103
- "loss": 0.263,
104
- "step": 5000
105
- },
106
- {
107
- "epoch": 3.91,
108
- "learning_rate": 2.831857920967365e-05,
109
- "loss": 0.2638,
110
- "step": 5500
111
- },
112
- {
113
- "epoch": 4.0,
114
- "eval_accuracy": 0.8577653283535637,
115
- "eval_f1": 0.8580479726153486,
116
- "eval_loss": 0.5590450167655945,
117
- "eval_precision": 0.8593690748266627,
118
- "eval_recall": 0.8577653283535637,
119
- "eval_runtime": 15.5871,
120
- "eval_samples_per_second": 206.132,
121
- "eval_steps_per_second": 25.791,
122
- "step": 5632
123
- },
124
- {
125
- "epoch": 4.26,
126
- "learning_rate": 2.793318754922627e-05,
127
- "loss": 0.2316,
128
- "step": 6000
129
- },
130
- {
131
- "epoch": 4.62,
132
- "learning_rate": 2.7547795888778885e-05,
133
- "loss": 0.2292,
134
- "step": 6500
135
- },
136
- {
137
- "epoch": 4.97,
138
- "learning_rate": 2.7162404228331504e-05,
139
- "loss": 0.2314,
140
- "step": 7000
141
- },
142
- {
143
- "epoch": 5.0,
144
- "eval_accuracy": 0.8490507314036726,
145
- "eval_f1": 0.8487038312585119,
146
- "eval_loss": 0.5605392456054688,
147
- "eval_precision": 0.848937798685001,
148
- "eval_recall": 0.8490507314036726,
149
- "eval_runtime": 14.9336,
150
- "eval_samples_per_second": 215.153,
151
- "eval_steps_per_second": 26.919,
152
- "step": 7040
153
- },
154
- {
155
- "epoch": 5.33,
156
- "learning_rate": 2.6777012567884123e-05,
157
- "loss": 0.1992,
158
- "step": 7500
159
- },
160
- {
161
- "epoch": 5.68,
162
- "learning_rate": 2.6391620907436738e-05,
163
- "loss": 0.2221,
164
- "step": 8000
165
- },
166
- {
167
- "epoch": 6.0,
168
- "eval_accuracy": 0.8415810768751946,
169
- "eval_f1": 0.8413911882051015,
170
- "eval_loss": 0.6368530988693237,
171
- "eval_precision": 0.8413807388640939,
172
- "eval_recall": 0.8415810768751946,
173
- "eval_runtime": 14.6321,
174
- "eval_samples_per_second": 219.586,
175
- "eval_steps_per_second": 27.474,
176
- "step": 8448
177
- },
178
- {
179
- "epoch": 6.04,
180
- "learning_rate": 2.600622924698936e-05,
181
- "loss": 0.2064,
182
- "step": 8500
183
- },
184
- {
185
- "epoch": 6.39,
186
- "learning_rate": 2.5620837586541976e-05,
187
- "loss": 0.1943,
188
- "step": 9000
189
- },
190
- {
191
- "epoch": 6.75,
192
- "learning_rate": 2.5235445926094595e-05,
193
- "loss": 0.1939,
194
- "step": 9500
195
- },
196
- {
197
- "epoch": 7.0,
198
- "eval_accuracy": 0.8400248988484282,
199
- "eval_f1": 0.8401859753110656,
200
- "eval_loss": 0.6518161296844482,
201
- "eval_precision": 0.8405358987959715,
202
- "eval_recall": 0.8400248988484282,
203
- "eval_runtime": 15.2445,
204
- "eval_samples_per_second": 210.764,
205
- "eval_steps_per_second": 26.37,
206
- "step": 9856
207
- },
208
- {
209
- "epoch": 7.1,
210
- "learning_rate": 2.4850054265647214e-05,
211
- "loss": 0.2117,
212
- "step": 10000
213
- },
214
- {
215
- "epoch": 7.46,
216
- "learning_rate": 2.446466260519983e-05,
217
- "loss": 0.198,
218
- "step": 10500
219
- },
220
- {
221
- "epoch": 7.81,
222
- "learning_rate": 2.4079270944752448e-05,
223
- "loss": 0.2015,
224
- "step": 11000
225
- },
226
- {
227
- "epoch": 8.0,
228
- "eval_accuracy": 0.8462496109554933,
229
- "eval_f1": 0.8456511274707091,
230
- "eval_loss": 0.6041903495788574,
231
- "eval_precision": 0.8464673674599805,
232
- "eval_recall": 0.8462496109554933,
233
- "eval_runtime": 14.8589,
234
- "eval_samples_per_second": 216.234,
235
- "eval_steps_per_second": 27.054,
236
- "step": 11264
237
- },
238
- {
239
- "epoch": 8.17,
240
- "learning_rate": 2.3693879284305067e-05,
241
- "loss": 0.1896,
242
- "step": 11500
243
- },
244
- {
245
- "epoch": 8.52,
246
- "learning_rate": 2.3308487623857682e-05,
247
- "loss": 0.1932,
248
- "step": 12000
249
- },
250
- {
251
- "epoch": 8.88,
252
- "learning_rate": 2.29230959634103e-05,
253
- "loss": 0.1989,
254
- "step": 12500
255
- },
256
- {
257
- "epoch": 9.0,
258
- "eval_accuracy": 0.8499844382197324,
259
- "eval_f1": 0.8496464092791962,
260
- "eval_loss": 0.6235840320587158,
261
- "eval_precision": 0.8498702852768623,
262
- "eval_recall": 0.8499844382197324,
263
- "eval_runtime": 15.7802,
264
- "eval_samples_per_second": 203.61,
265
- "eval_steps_per_second": 25.475,
266
- "step": 12672
267
- }
268
- ],
269
- "max_steps": 42240,
270
- "num_train_epochs": 30,
271
- "total_flos": 3931395111413520.0,
272
- "trial_name": null,
273
- "trial_params": null
274
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c07d398af21a16d9c74ceca38be74c689e7fefb963b4f8da37b6c49e55121eea
3
- size 3631
 
 
 
 
last-checkpoint/vocab.txt DELETED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea0028124c16c42b0173d84c15dfc6aaf99389e964846d869e1df752e59e8dec
3
  size 435769709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cc09466df4f7451ec73c9e2f59c8ca058f7d217f855947f6d8de3558d655167
3
  size 435769709