radic2682 committed on
Commit
6c5ab83
1 Parent(s): 84c4875

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ eval_nbest_predictions.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -3,6 +3,8 @@ license: apache-2.0
3
  base_model: google/bigbird-roberta-base
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: bigBird-base-fine-tuning-squad-B16R3-nobias
8
  results: []
@@ -13,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # bigBird-base-fine-tuning-squad-B16R3-nobias
15
 
16
- This model is a fine-tuned version of [google/bigbird-roberta-base](https://huggingface.co/google/bigbird-roberta-base) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
3
  base_model: google/bigbird-roberta-base
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - squad
8
  model-index:
9
  - name: bigBird-base-fine-tuning-squad-B16R3-nobias
10
  results: []
 
15
 
16
  # bigBird-base-fine-tuning-squad-B16R3-nobias
17
 
18
+ This model is a fine-tuned version of [google/bigbird-roberta-base](https://huggingface.co/google/bigbird-roberta-base) on the squad dataset.
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "epoch": 2.0,
3
- "eval_exact_match": 89.84375,
4
- "eval_f1": 91.5327380952381,
5
  "eval_model_preparation_time": 0.0018,
6
- "eval_runtime": 9.9215,
7
- "eval_samples": 128,
8
- "eval_samples_per_second": 12.901,
9
- "eval_steps_per_second": 0.101,
10
- "total_flos": 3.864501390676132e+17,
11
- "train_loss": 0.05644623499482734,
12
- "train_runtime": 4615.1991,
13
  "train_samples": 87599,
14
- "train_samples_per_second": 37.961,
15
- "train_steps_per_second": 9.49
16
  }
 
1
  {
2
  "epoch": 2.0,
3
+ "eval_exact_match": 82.32734153263955,
4
+ "eval_f1": 89.22304303329197,
5
  "eval_model_preparation_time": 0.0018,
6
+ "eval_runtime": 834.3564,
7
+ "eval_samples": 10570,
8
+ "eval_samples_per_second": 12.668,
9
+ "eval_steps_per_second": 1.584,
10
+ "total_flos": 3.8619551920019866e+17,
11
+ "train_loss": 0.9270246051109,
12
+ "train_runtime": 51747.0424,
13
  "train_samples": 87599,
14
+ "train_samples_per_second": 3.386,
15
+ "train_steps_per_second": 0.423
16
  }
eval_nbest_predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
eval_predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "eval_exact_match": 89.84375,
3
- "eval_f1": 91.5327380952381,
4
- "eval_model_preparation_time": 0.0018,
5
- "eval_runtime": 9.9215,
6
- "eval_samples": 128,
7
- "eval_samples_per_second": 12.901,
8
- "eval_steps_per_second": 0.101
9
  }
 
1
  {
2
+ "epoch": 2.0,
3
+ "eval_exact_match": 82.32734153263955,
4
+ "eval_f1": 89.22304303329197,
5
+ "eval_runtime": 834.3564,
6
+ "eval_samples": 10570,
7
+ "eval_samples_per_second": 12.668,
8
+ "eval_steps_per_second": 1.584
9
  }
log/events.out.tfevents.1723149965.isl-gpu4.878776.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2f168d79fce90aba6e5b265cb4c52505c77107245cada8e9c987c5d1d9529e5
3
+ size 418
log/events.out.tfevents.1723149965.isl-gpu4.878776.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b008e94da6b7c8aeb7de0468302961370fad647060c22a4453c5e5eddf6e9cf
3
+ size 418
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 2.0,
3
- "total_flos": 3.864501390676132e+17,
4
- "train_loss": 0.05644623499482734,
5
- "train_runtime": 4615.1991,
6
  "train_samples": 87599,
7
- "train_samples_per_second": 37.961,
8
- "train_steps_per_second": 9.49
9
  }
 
1
  {
2
  "epoch": 2.0,
3
+ "total_flos": 3.8619551920019866e+17,
4
+ "train_loss": 0.9270246051109,
5
+ "train_runtime": 51747.0424,
6
  "train_samples": 87599,
7
+ "train_samples_per_second": 3.386,
8
+ "train_steps_per_second": 0.423
9
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff