Francesco0101 committed on
Commit
38e9cff
1 Parent(s): 7f0f020

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distilbert-base-uncased",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
 
1
  {
2
+ "_name_or_path": "Francesco0101/FRABERT-distilbert-base-uncased-51086",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5f4f42ed8726a01ec1769407ef1ce59631c300e93dc2a837e341dffecd02c17
3
  size 267835644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9acbbe59cc669bdd8860b3794df868e64b8903a4b29ed3a4f9607ba004dcb07
3
  size 267835644
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:687fdb80383701a262471eb09c7d2a63664bc1c45e3e06d64da2b2d8a6f07348
3
  size 535733434
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af56ec53953a4ce58073c6101f5d14112919323e7ff06caab1a8bc1ef88a4714
3
  size 535733434
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5829fdfb8ea3cfd8973041e1f4b84b188f3f51504415d377549403e604291433
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdf0dc39fa720efae5c87e2de3716c48674926551f71a0ba6dd10c6c02d77977
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a69b3a106ff3c8a053e64914963cacbd3b7c2581f1211e4c028a3c55f28ee8e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de7e2d35d1ac9cba6b442f08642ba93349bda77fc797f94a4764ad943e52ad2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6955057953127977,
3
  "best_model_checkpoint": "training_dir/checkpoint-3193",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 9579,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -64,12 +64,31 @@
64
  "eval_samples_per_second": 82.493,
65
  "eval_steps_per_second": 10.312,
66
  "step": 9579
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 500,
70
- "max_steps": 19158,
71
  "num_input_tokens_seen": 0,
72
- "num_train_epochs": 6,
73
  "save_steps": 500,
74
  "stateful_callbacks": {
75
  "TrainerControl": {
@@ -83,7 +102,7 @@
83
  "attributes": {}
84
  }
85
  },
86
- "total_flos": 2.000505291334038e+16,
87
  "train_batch_size": 16,
88
  "trial_name": null,
89
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6955057953127977,
3
  "best_model_checkpoint": "training_dir/checkpoint-3193",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 12772,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
64
  "eval_samples_per_second": 82.493,
65
  "eval_steps_per_second": 10.312,
66
  "step": 9579
67
+ },
68
+ {
69
+ "epoch": 4.0,
70
+ "grad_norm": 7.0213212966918945,
71
+ "learning_rate": 6.0954502068087814e-05,
72
+ "loss": 0.2568,
73
+ "step": 12772
74
+ },
75
+ {
76
+ "epoch": 4.0,
77
+ "eval_accuracy": 0.6853146853146853,
78
+ "eval_f1": 0.6752368731633129,
79
+ "eval_loss": 1.3729437589645386,
80
+ "eval_precision": 0.6983670162522349,
81
+ "eval_recall": 0.6853146853146853,
82
+ "eval_runtime": 30.1468,
83
+ "eval_samples_per_second": 75.895,
84
+ "eval_steps_per_second": 9.487,
85
+ "step": 12772
86
  }
87
  ],
88
  "logging_steps": 500,
89
+ "max_steps": 31930,
90
  "num_input_tokens_seen": 0,
91
+ "num_train_epochs": 10,
92
  "save_steps": 500,
93
  "stateful_callbacks": {
94
  "TrainerControl": {
 
102
  "attributes": {}
103
  }
104
  },
105
+ "total_flos": 2.6676379106990172e+16,
106
  "train_batch_size": 16,
107
  "trial_name": null,
108
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adc25bad5e22cb00ec67cc5c6a1989c8fa44a7021556e9019cbdec8c4516a3cb
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb92a7fd44c3795edeffedfd95925fc357be78e9278a301e4f880ffc172a22b1
3
  size 5176