CesarLeblanc committed on
Commit
01734ca
·
verified ·
1 Parent(s): 713d15a

Model save

Browse files
Files changed (4) hide show
  1. README.md +9 -9
  2. config.json +4 -4
  3. model.safetensors +2 -2
  4. training_args.bin +1 -1
README.md CHANGED
@@ -15,8 +15,8 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model was trained from scratch on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 1.9785
19
- - Accuracy: 0.4472
20
 
21
  ## Model description
22
 
@@ -36,8 +36,8 @@ More information needed
36
 
37
  The following hyperparameters were used during training:
38
  - learning_rate: 5e-05
39
- - train_batch_size: 8
40
- - eval_batch_size: 8
41
  - seed: 123
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: linear
@@ -48,11 +48,11 @@ The following hyperparameters were used during training:
48
 
49
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
50
  |:-------------:|:-----:|:------:|:---------------:|:--------:|
51
- | 2.0838 | 1.0 | 34200 | 2.1737 | 0.4064 |
52
- | 1.8703 | 2.0 | 68400 | 2.0177 | 0.4362 |
53
- | 1.8733 | 3.0 | 102600 | 1.9902 | 0.4368 |
54
- | 1.6634 | 4.0 | 136800 | 1.9717 | 0.4455 |
55
- | 1.6316 | 5.0 | 171000 | 1.9785 | 0.4472 |
56
 
57
 
58
  ### Framework versions
 
15
 
16
  This model was trained from scratch on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 4.2249
19
+ - Accuracy: 0.0948
20
 
21
  ## Model description
22
 
 
36
 
37
  The following hyperparameters were used during training:
38
  - learning_rate: 5e-05
39
+ - train_batch_size: 4
40
+ - eval_batch_size: 4
41
  - seed: 123
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: linear
 
48
 
49
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
50
  |:-------------:|:-----:|:------:|:---------------:|:--------:|
51
+ | 4.1776 | 1.0 | 68400 | 4.2204 | 0.0948 |
52
+ | 4.2058 | 2.0 | 136800 | 4.2118 | 0.0948 |
53
+ | 4.1949 | 3.0 | 205200 | 4.2219 | 0.0948 |
54
+ | 4.1297 | 4.0 | 273600 | 4.2298 | 0.0948 |
55
+ | 4.2056 | 5.0 | 342000 | 4.2249 | 0.0948 |
56
 
57
 
58
  ### Framework versions
config.json CHANGED
@@ -8,7 +8,7 @@
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "id2label": {
13
  "0": "LABEL_0",
14
  "1": "LABEL_1",
@@ -212,7 +212,7 @@
212
  "199": "LABEL_199"
213
  },
214
  "initializer_range": 0.02,
215
- "intermediate_size": 3072,
216
  "label2id": {
217
  "LABEL_0": 0,
218
  "LABEL_1": 1,
@@ -418,8 +418,8 @@
418
  "layer_norm_eps": 1e-12,
419
  "max_position_embeddings": 512,
420
  "model_type": "bert",
421
- "num_attention_heads": 12,
422
- "num_hidden_layers": 12,
423
  "pad_token_id": 0,
424
  "position_embedding_type": "absolute",
425
  "problem_type": "single_label_classification",
 
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
  "id2label": {
13
  "0": "LABEL_0",
14
  "1": "LABEL_1",
 
212
  "199": "LABEL_199"
213
  },
214
  "initializer_range": 0.02,
215
+ "intermediate_size": 4096,
216
  "label2id": {
217
  "LABEL_0": 0,
218
  "LABEL_1": 1,
 
418
  "layer_norm_eps": 1e-12,
419
  "max_position_embeddings": 512,
420
  "model_type": "bert",
421
+ "num_attention_heads": 16,
422
+ "num_hidden_layers": 24,
423
  "pad_token_id": 0,
424
  "position_embedding_type": "absolute",
425
  "problem_type": "single_label_classification",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c5ae12f57547f1a771d7d67e797e2af145391866394d8dfa8168a08f8fe1691
3
- size 473551648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c7d0048dc65573b7291b2036889f6e18b0345c3c3111fff8eec59693017cdec
3
+ size 1388079840
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd41aa8a858ba1c9475c1b00f49df12f3c431f5e41d29eed4d95382544c7d510
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51e423a43e2c343212f9e7679f0b3d1aff9fe7a7b292399f81c25b5157e5e97d
3
  size 4664