Shresthadev403 committed on
Commit
ba79768
1 Parent(s): 3d58b30

End of training

Browse files
README.md CHANGED
@@ -14,6 +14,8 @@ should probably proofread and complete it, then remove this comment. -->
14
  # bert-base-banking77-pt2
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
 
 
17
 
18
  ## Model description
19
 
@@ -40,7 +42,7 @@ The following hyperparameters were used during training:
40
  - total_train_batch_size: 640
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 7
44
 
45
  ### Training results
46
 
 
14
  # bert-base-banking77-pt2
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
17
+ It achieves the following results on the evaluation set:
18
+ - Loss: 6.2882
19
 
20
  ## Model description
21
 
 
42
  - total_train_batch_size: 640
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
+ - num_epochs: 10
46
 
47
  ### Training results
48
 
logs/events.out.tfevents.1702227000.07df5a8b60a1.2585.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3fd0f274d60d2b02e3f867847b550b0b73ce4905bf94570b51a2f06fe209739
3
+ size 5224
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbdf21c65e42ecf425af13ee6cb1bc584fb68ab844200b542e0174b7ee5e4cb4
3
  size 497814144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6729e64018ebc5616c73c83749f191be7b30355301edcf01b4dc16b751c61810
3
  size 497814144
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 4.375,
5
  "eval_steps": 10,
6
- "global_step": 7,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -25,13 +25,36 @@
25
  "train_runtime": 0.0348,
26
  "train_samples_per_second": 201109.164,
27
  "train_steps_per_second": 201.109
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  }
29
  ],
30
  "logging_steps": 10,
31
- "max_steps": 7,
32
- "num_train_epochs": 7,
33
  "save_steps": 10,
34
- "total_flos": 286376067072000.0,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
1
  {
2
+ "best_metric": 6.288247108459473,
3
+ "best_model_checkpoint": "bert-base-banking77-pt2/checkpoint-10",
4
+ "epoch": 8.875,
5
  "eval_steps": 10,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
25
  "train_runtime": 0.0348,
26
  "train_samples_per_second": 201109.164,
27
  "train_steps_per_second": 201.109
28
+ },
29
+ {
30
+ "epoch": 8.88,
31
+ "learning_rate": 3.5e-05,
32
+ "loss": 7.1176,
33
+ "step": 10
34
+ },
35
+ {
36
+ "epoch": 8.88,
37
+ "eval_loss": 6.288247108459473,
38
+ "eval_runtime": 12.385,
39
+ "eval_samples_per_second": 80.743,
40
+ "eval_steps_per_second": 2.584,
41
+ "step": 10
42
+ },
43
+ {
44
+ "epoch": 8.88,
45
+ "step": 10,
46
+ "total_flos": 410228490240000.0,
47
+ "train_loss": 2.135270118713379,
48
+ "train_runtime": 92.0794,
49
+ "train_samples_per_second": 108.602,
50
+ "train_steps_per_second": 0.109
51
  }
52
  ],
53
  "logging_steps": 10,
54
+ "max_steps": 10,
55
+ "num_train_epochs": 10,
56
  "save_steps": 10,
57
+ "total_flos": 410228490240000.0,
58
  "trial_name": null,
59
  "trial_params": null
60
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3120a79b950bf9a79bef5fab066d940b2c8afce2622e34f82e0c5edb68126598
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd8fdabe3ce8b5faf7d270d98467375c27a1b24feaf5108409ab4e5f05f2e744
3
  size 4600