Rodrigo1771 commited on
Commit
889ed0e
1 Parent(s): c844b13

End of training

Browse files
README.md CHANGED
@@ -2,9 +2,10 @@
2
  license: apache-2.0
3
  base_model: PlanTL-GOB-ES/bsc-bio-ehr-es
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
- - combined-train-drugtemist-dev-ner
8
  metrics:
9
  - precision
10
  - recall
@@ -17,24 +18,24 @@ model-index:
17
  name: Token Classification
18
  type: token-classification
19
  dataset:
20
- name: combined-train-drugtemist-dev-ner
21
- type: combined-train-drugtemist-dev-ner
22
  config: CombinedTrainDrugTEMISTDevNER
23
  split: validation
24
  args: CombinedTrainDrugTEMISTDevNER
25
  metrics:
26
  - name: Precision
27
  type: precision
28
- value: 0.0914341567442687
29
  - name: Recall
30
  type: recall
31
- value: 0.9457720588235294
32
  - name: F1
33
  type: f1
34
- value: 0.16674769081186194
35
  - name: Accuracy
36
  type: accuracy
37
- value: 0.7820794485561674
38
  ---
39
 
40
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -42,13 +43,13 @@ should probably proofread and complete it, then remove this comment. -->
42
 
43
  # output
44
 
45
- This model is a fine-tuned version of [PlanTL-GOB-ES/bsc-bio-ehr-es](https://huggingface.co/PlanTL-GOB-ES/bsc-bio-ehr-es) on the combined-train-drugtemist-dev-ner dataset.
46
  It achieves the following results on the evaluation set:
47
- - Loss: 1.4862
48
- - Precision: 0.0914
49
- - Recall: 0.9458
50
- - F1: 0.1667
51
- - Accuracy: 0.7821
52
 
53
  ## Model description
54
 
 
2
  license: apache-2.0
3
  base_model: PlanTL-GOB-ES/bsc-bio-ehr-es
4
  tags:
5
+ - token-classification
6
  - generated_from_trainer
7
  datasets:
8
+ - Rodrigo1771/combined-train-drugtemist-dev-ner
9
  metrics:
10
  - precision
11
  - recall
 
18
  name: Token Classification
19
  type: token-classification
20
  dataset:
21
+ name: Rodrigo1771/combined-train-drugtemist-dev-ner
22
+ type: Rodrigo1771/combined-train-drugtemist-dev-ner
23
  config: CombinedTrainDrugTEMISTDevNER
24
  split: validation
25
  args: CombinedTrainDrugTEMISTDevNER
26
  metrics:
27
  - name: Precision
28
  type: precision
29
+ value: 0.09532555790247038
30
  - name: Recall
31
  type: recall
32
+ value: 0.9540441176470589
33
  - name: F1
34
  type: f1
35
+ value: 0.17333222008850296
36
  - name: Accuracy
37
  type: accuracy
38
+ value: 0.7932840841995413
39
  ---
40
 
41
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
43
 
44
  # output
45
 
46
+ This model is a fine-tuned version of [PlanTL-GOB-ES/bsc-bio-ehr-es](https://huggingface.co/PlanTL-GOB-ES/bsc-bio-ehr-es) on the Rodrigo1771/combined-train-drugtemist-dev-ner dataset.
47
  It achieves the following results on the evaluation set:
48
+ - Loss: 1.0503
49
+ - Precision: 0.0953
50
+ - Recall: 0.9540
51
+ - F1: 0.1733
52
+ - Accuracy: 0.7933
53
 
54
  ## Model description
55
 
all_results.json CHANGED
@@ -1,26 +1,26 @@
1
  {
2
  "epoch": 9.988249118683902,
3
- "eval_accuracy": 0.8601754843670617,
4
- "eval_f1": 0.4624414693662204,
5
- "eval_loss": 0.6266195774078369,
6
- "eval_precision": 0.32197630636422075,
7
- "eval_recall": 0.8203088441740758,
8
- "eval_runtime": 14.995,
9
  "eval_samples": 6810,
10
- "eval_samples_per_second": 454.15,
11
- "eval_steps_per_second": 56.819,
12
- "predict_accuracy": 0.9510588123763138,
13
- "predict_f1": 0.6555634301913535,
14
- "predict_loss": 0.18893657624721527,
15
- "predict_precision": 0.5454009433962265,
16
- "predict_recall": 0.8214920071047958,
17
- "predict_runtime": 30.3218,
18
- "predict_samples_per_second": 481.964,
19
- "predict_steps_per_second": 60.254,
20
  "total_flos": 1.2649810588547778e+16,
21
  "train_loss": 0.10639642311544979,
22
- "train_runtime": 1205.6346,
23
  "train_samples": 27229,
24
- "train_samples_per_second": 225.848,
25
- "train_steps_per_second": 3.525
26
  }
 
1
  {
2
  "epoch": 9.988249118683902,
3
+ "eval_accuracy": 0.7932840841995413,
4
+ "eval_f1": 0.17333222008850296,
5
+ "eval_loss": 1.0502684116363525,
6
+ "eval_precision": 0.09532555790247038,
7
+ "eval_recall": 0.9540441176470589,
8
+ "eval_runtime": 14.6851,
9
  "eval_samples": 6810,
10
+ "eval_samples_per_second": 463.735,
11
+ "eval_steps_per_second": 58.018,
12
+ "predict_accuracy": 0.8808544760053879,
13
+ "predict_f1": 0.24078298623886968,
14
+ "predict_loss": 0.62894606590271,
15
+ "predict_precision": 0.1378032345013477,
16
+ "predict_recall": 0.9528246942341293,
17
+ "predict_runtime": 29.8715,
18
+ "predict_samples_per_second": 489.229,
19
+ "predict_steps_per_second": 61.162,
20
  "total_flos": 1.2649810588547778e+16,
21
  "train_loss": 0.10639642311544979,
22
+ "train_runtime": 1208.2019,
23
  "train_samples": 27229,
24
+ "train_samples_per_second": 225.368,
25
+ "train_steps_per_second": 3.518
26
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 9.988249118683902,
3
- "eval_accuracy": 0.8601754843670617,
4
- "eval_f1": 0.4624414693662204,
5
- "eval_loss": 0.6266195774078369,
6
- "eval_precision": 0.32197630636422075,
7
- "eval_recall": 0.8203088441740758,
8
- "eval_runtime": 14.995,
9
  "eval_samples": 6810,
10
- "eval_samples_per_second": 454.15,
11
- "eval_steps_per_second": 56.819
12
  }
 
1
  {
2
  "epoch": 9.988249118683902,
3
+ "eval_accuracy": 0.7932840841995413,
4
+ "eval_f1": 0.17333222008850296,
5
+ "eval_loss": 1.0502684116363525,
6
+ "eval_precision": 0.09532555790247038,
7
+ "eval_recall": 0.9540441176470589,
8
+ "eval_runtime": 14.6851,
9
  "eval_samples": 6810,
10
+ "eval_samples_per_second": 463.735,
11
+ "eval_steps_per_second": 58.018
12
  }
predict_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "predict_accuracy": 0.9510588123763138,
3
- "predict_f1": 0.6555634301913535,
4
- "predict_loss": 0.18893657624721527,
5
- "predict_precision": 0.5454009433962265,
6
- "predict_recall": 0.8214920071047958,
7
- "predict_runtime": 30.3218,
8
- "predict_samples_per_second": 481.964,
9
- "predict_steps_per_second": 60.254
10
  }
 
1
  {
2
+ "predict_accuracy": 0.8808544760053879,
3
+ "predict_f1": 0.24078298623886968,
4
+ "predict_loss": 0.62894606590271,
5
+ "predict_precision": 0.1378032345013477,
6
+ "predict_recall": 0.9528246942341293,
7
+ "predict_runtime": 29.8715,
8
+ "predict_samples_per_second": 489.229,
9
+ "predict_steps_per_second": 61.162
10
  }
tb/events.out.tfevents.1725049039.6b97e535edda.13440.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f105690f828d701992cc9bf50b2d6c540b9476f5cd4584b9d782e2db879b27e7
3
+ size 560
train.log CHANGED
@@ -1553,3 +1553,53 @@ Training completed. Do not forget to share your model on huggingface.co/models =
1553
  {'eval_loss': 1.4861844778060913, 'eval_precision': 0.0914341567442687, 'eval_recall': 0.9457720588235294, 'eval_f1': 0.16674769081186194, 'eval_accuracy': 0.7820794485561674, 'eval_runtime': 15.3988, 'eval_samples_per_second': 442.243, 'eval_steps_per_second': 55.329, 'epoch': 9.99}
1554
  {'train_runtime': 1208.2019, 'train_samples_per_second': 225.368, 'train_steps_per_second': 3.518, 'train_loss': 0.10639642311544979, 'epoch': 9.99}
1555
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1556
  0%| | 0/852 [00:00<?, ?it/s]
1557
  1%| | 10/852 [00:00<00:09, 90.08it/s]
1558
  2%|▏ | 20/852 [00:00<00:10, 78.76it/s]
1559
  3%|▎ | 28/852 [00:00<00:10, 78.02it/s]
1560
  4%|▍ | 36/852 [00:00<00:10, 78.47it/s]
1561
  5%|▌ | 44/852 [00:00<00:10, 78.61it/s]
1562
  6%|▌ | 53/852 [00:00<00:10, 79.34it/s]
1563
  7%|▋ | 62/852 [00:00<00:09, 79.85it/s]
1564
  8%|▊ | 70/852 [00:00<00:10, 77.38it/s]
1565
  9%|▉ | 78/852 [00:00<00:09, 78.05it/s]
1566
  10%|█ | 86/852 [00:01<00:09, 77.50it/s]
1567
  11%|█ | 94/852 [00:01<00:09, 76.16it/s]
1568
  12%|█▏ | 103/852 [00:01<00:09, 77.40it/s]
1569
  13%|█▎ | 111/852 [00:01<00:09, 77.04it/s]
1570
  14%|█▍ | 119/852 [00:01<00:09, 77.45it/s]
1571
  15%|█▍ | 127/852 [00:01<00:09, 74.43it/s]
1572
  16%|█▌ | 135/852 [00:01<00:09, 75.89it/s]
1573
  17%|█▋ | 143/852 [00:01<00:09, 76.32it/s]
1574
  18%|█▊ | 151/852 [00:01<00:09, 75.91it/s]
1575
  19%|█▉ | 160/852 [00:02<00:08, 78.09it/s]
1576
  20%|█▉ | 168/852 [00:02<00:08, 78.48it/s]
1577
  21%|██ | 176/852 [00:02<00:08, 78.21it/s]
1578
  22%|██▏ | 184/852 [00:02<00:08, 78.18it/s]
1579
  23%|██▎ | 192/852 [00:02<00:08, 78.36it/s]
1580
  24%|██▎ | 201/852 [00:02<00:08, 79.00it/s]
1581
  25%|██▍ | 209/852 [00:02<00:08, 76.98it/s]
1582
  25%|██▌ | 217/852 [00:02<00:08, 77.31it/s]
1583
  26%|██▋ | 225/852 [00:02<00:08, 77.91it/s]
1584
  27%|██▋ | 234/852 [00:03<00:07, 78.41it/s]
1585
  28%|██▊ | 242/852 [00:03<00:08, 75.26it/s]
1586
  29%|██▉ | 250/852 [00:03<00:07, 76.11it/s]
1587
  30%|███ | 258/852 [00:03<00:07, 76.87it/s]
1588
  31%|███ | 266/852 [00:03<00:07, 77.23it/s]
1589
  32%|███▏ | 274/852 [00:03<00:07, 76.72it/s]
1590
  33%|███▎ | 283/852 [00:03<00:07, 77.64it/s]
1591
  34%|███▍ | 291/852 [00:03<00:07, 77.42it/s]
1592
  35%|███▌ | 300/852 [00:03<00:07, 78.54it/s]
1593
  36%|███▋ | 309/852 [00:03<00:06, 79.83it/s]
1594
  37%|███▋ | 317/852 [00:04<00:06, 77.81it/s]
1595
  38%|███▊ | 325/852 [00:04<00:06, 77.95it/s]
1596
  39%|███▉ | 333/852 [00:04<00:06, 77.82it/s]
1597
  40%|████ | 341/852 [00:04<00:06, 78.04it/s]
1598
  41%|████ | 349/852 [00:04<00:06, 77.95it/s]
1599
  42%|████▏ | 357/852 [00:04<00:06, 75.79it/s]
1600
  43%|████▎ | 366/852 [00:04<00:06, 76.55it/s]
1601
  44%|████▍ | 375/852 [00:04<00:06, 77.81it/s]
1602
  45%|████▍ | 383/852 [00:04<00:06, 76.63it/s]
1603
  46%|████▌ | 391/852 [00:05<00:05, 77.37it/s]
1604
  47%|████▋ | 399/852 [00:05<00:05, 77.36it/s]
1605
  48%|████▊ | 407/852 [00:05<00:05, 74.94it/s]
1606
  49%|████▊ | 415/852 [00:05<00:05, 75.29it/s]
1607
  50%|████▉ | 423/852 [00:05<00:05, 75.49it/s]
1608
  51%|█████ | 431/852 [00:05<00:05, 75.09it/s]
1609
  52%|█████▏ | 440/852 [00:05<00:05, 76.74it/s]
1610
  53%|█████▎ | 448/852 [00:05<00:05, 76.92it/s]
1611
  54%|█████▎ | 456/852 [00:05<00:05, 77.77it/s]
1612
  54%|█████▍ | 464/852 [00:05<00:05, 76.63it/s]
1613
  55%|█████▌ | 472/852 [00:06<00:05, 72.05it/s]
1614
  56%|█████▋ | 480/852 [00:06<00:05, 73.97it/s]
1615
  57%|█████▋ | 488/852 [00:06<00:04, 74.06it/s]
1616
  58%|█████▊ | 496/852 [00:06<00:04, 75.08it/s]
1617
  59%|█████▉ | 504/852 [00:06<00:04, 76.00it/s]
1618
  60%|██████ | 512/852 [00:06<00:04, 76.30it/s]
1619
  61%|██████ | 520/852 [00:06<00:04, 76.76it/s]
1620
  62%|██████▏ | 528/852 [00:06<00:04, 74.32it/s]
1621
  63%|██████▎ | 536/852 [00:06<00:04, 75.58it/s]
1622
  64%|██████▍ | 544/852 [00:07<00:04, 76.71it/s]
1623
  65%|██████▍ | 552/852 [00:07<00:04, 74.95it/s]
1624
  66%|██████▌ | 560/852 [00:07<00:03, 75.87it/s]
1625
  67%|██████▋ | 568/852 [00:07<00:03, 76.63it/s]
1626
  68%|██████▊ | 576/852 [00:07<00:03, 76.40it/s]
1627
  69%|██████▊ | 584/852 [00:07<00:03, 75.28it/s]
1628
  69%|██████▉ | 592/852 [00:07<00:03, 75.66it/s]
1629
  70%|███████ | 600/852 [00:07<00:03, 75.20it/s]
1630
  71%|███████▏ | 608/852 [00:07<00:03, 74.78it/s]
1631
  72%|███████▏ | 616/852 [00:08<00:03, 73.06it/s]
1632
  73%|███████▎ | 624/852 [00:08<00:03, 74.76it/s]
1633
  74%|███████▍ | 632/852 [00:08<00:03, 73.28it/s]
1634
  75%|███████▌ | 640/852 [00:08<00:02, 73.23it/s]
1635
  76%|███████▌ | 648/852 [00:08<00:02, 72.28it/s]
1636
  77%|███████▋ | 656/852 [00:08<00:02, 74.30it/s]
1637
  78%|███████▊ | 664/852 [00:08<00:02, 74.53it/s]
1638
  79%|███████▉ | 672/852 [00:08<00:02, 74.57it/s]
1639
  80%|███████▉ | 680/852 [00:08<00:02, 75.61it/s]
1640
  81%|████████ | 689/852 [00:08<00:02, 77.74it/s]
1641
  82%|████████▏ | 697/852 [00:09<00:02, 76.57it/s]
1642
  83%|████████▎ | 706/852 [00:09<00:01, 77.79it/s]
1643
  84%|████████▍ | 714/852 [00:09<00:01, 78.22it/s]
1644
  85%|████████▍ | 722/852 [00:09<00:01, 77.26it/s]
1645
  86%|████████▌ | 731/852 [00:09<00:01, 78.66it/s]
1646
  87%|████████▋ | 740/852 [00:09<00:01, 79.91it/s]
1647
  88%|████████▊ | 749/852 [00:09<00:01, 80.22it/s]
1648
  89%|████████▉ | 758/852 [00:09<00:01, 80.35it/s]
1649
  90%|█████████ | 767/852 [00:09<00:01, 79.25it/s]
1650
  91%|█████████ | 776/852 [00:10<00:00, 79.74it/s]
1651
  92%|█████████▏| 784/852 [00:10<00:00, 79.50it/s]
1652
  93%|█████████▎| 792/852 [00:10<00:00, 79.31it/s]
1653
  94%|█████████▍| 800/852 [00:10<00:00, 79.49it/s]
1654
  95%|█████████▍| 809/852 [00:10<00:00, 81.08it/s]
1655
  96%|█████████▌| 818/852 [00:10<00:00, 79.55it/s]
1656
  97%|█████████▋| 827/852 [00:10<00:00, 81.06it/s]
1657
  98%|█████████▊| 836/852 [00:10<00:00, 81.02it/s]
1658
  99%|█████████▉| 845/852 [00:10<00:00, 79.78it/s]/usr/local/lib/python3.10/dist-packages/seqeval/metrics/v1.py:57: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples. Use `zero_division` parameter to control this behavior.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1659
  0%| | 0/1827 [00:00<?, ?it/s]
1660
  1%| | 10/1827 [00:00<00:20, 87.94it/s]
1661
  1%| | 19/1827 [00:00<00:22, 79.79it/s]
1662
  1%|▏ | 27/1827 [00:00<00:22, 79.33it/s]
1663
  2%|▏ | 35/1827 [00:00<00:22, 78.11it/s]
1664
  2%|▏ | 44/1827 [00:00<00:22, 80.08it/s]
1665
  3%|▎ | 53/1827 [00:00<00:22, 79.80it/s]
1666
  3%|▎ | 61/1827 [00:00<00:22, 77.38it/s]
1667
  4%|▍ | 70/1827 [00:00<00:22, 77.96it/s]
1668
  4%|▍ | 79/1827 [00:00<00:21, 80.62it/s]
1669
  5%|▍ | 88/1827 [00:01<00:21, 79.62it/s]
1670
  5%|▌ | 97/1827 [00:01<00:21, 81.19it/s]
1671
  6%|▌ | 106/1827 [00:01<00:20, 82.65it/s]
1672
  6%|▋ | 115/1827 [00:01<00:20, 82.97it/s]
1673
  7%|▋ | 124/1827 [00:01<00:21, 79.65it/s]
1674
  7%|▋ | 133/1827 [00:01<00:21, 79.51it/s]
1675
  8%|▊ | 142/1827 [00:01<00:20, 80.61it/s]
1676
  8%|▊ | 151/1827 [00:01<00:20, 81.06it/s]
1677
  9%|▉ | 160/1827 [00:02<00:21, 77.41it/s]
1678
  9%|▉ | 169/1827 [00:02<00:21, 78.59it/s]
1679
  10%|▉ | 178/1827 [00:02<00:20, 79.54it/s]
1680
  10%|█ | 187/1827 [00:02<00:20, 80.64it/s]
1681
  11%|█ | 196/1827 [00:02<00:20, 80.28it/s]
1682
  11%|█ | 205/1827 [00:02<00:20, 79.31it/s]
1683
  12%|█▏ | 213/1827 [00:02<00:20, 78.96it/s]
1684
  12%|█▏ | 222/1827 [00:02<00:20, 79.52it/s]
1685
  13%|█▎ | 230/1827 [00:02<00:20, 78.22it/s]
1686
  13%|█▎ | 238/1827 [00:02<00:20, 76.49it/s]
1687
  14%|█▎ | 247/1827 [00:03<00:20, 78.15it/s]
1688
  14%|█▍ | 256/1827 [00:03<00:19, 79.26it/s]
1689
  14%|█▍ | 264/1827 [00:03<00:20, 77.90it/s]
1690
  15%|█▍ | 273/1827 [00:03<00:19, 80.06it/s]
1691
  15%|█▌ | 282/1827 [00:03<00:19, 81.15it/s]
1692
  16%|█▌ | 291/1827 [00:03<00:19, 80.73it/s]
1693
  16%|█▋ | 300/1827 [00:03<00:18, 81.69it/s]
1694
  17%|█▋ | 309/1827 [00:03<00:18, 80.77it/s]
1695
  17%|█▋ | 318/1827 [00:03<00:18, 80.07it/s]
1696
  18%|█▊ | 327/1827 [00:04<00:18, 81.60it/s]
1697
  18%|█▊ | 336/1827 [00:04<00:18, 80.47it/s]
1698
  19%|█▉ | 345/1827 [00:04<00:18, 81.57it/s]
1699
  19%|█▉ | 354/1827 [00:04<00:19, 76.57it/s]
1700
  20%|█▉ | 362/1827 [00:04<00:19, 76.83it/s]
1701
  20%|██ | 370/1827 [00:04<00:18, 77.31it/s]
1702
  21%|██ | 378/1827 [00:04<00:18, 77.60it/s]
1703
  21%|██ | 386/1827 [00:04<00:18, 77.53it/s]
1704
  22%|██▏ | 394/1827 [00:04<00:18, 77.31it/s]
1705
  22%|██▏ | 402/1827 [00:05<00:18, 77.04it/s]
1706
  22%|██▏ | 410/1827 [00:05<00:18, 77.21it/s]
1707
  23%|██▎ | 418/1827 [00:05<00:18, 74.60it/s]
1708
  23%|██▎ | 426/1827 [00:05<00:18, 75.34it/s]
1709
  24%|██▍ | 434/1827 [00:05<00:18, 75.76it/s]
1710
  24%|██▍ | 442/1827 [00:05<00:18, 75.30it/s]
1711
  25%|██▍ | 450/1827 [00:05<00:18, 76.15it/s]
1712
  25%|██▌ | 459/1827 [00:05<00:17, 77.96it/s]
1713
  26%|██▌ | 468/1827 [00:05<00:17, 78.69it/s]
1714
  26%|██▌ | 476/1827 [00:06<00:17, 77.24it/s]
1715
  26%|██▋ | 484/1827 [00:06<00:17, 77.34it/s]
1716
  27%|██▋ | 492/1827 [00:06<00:17, 76.12it/s]
1717
  27%|██▋ | 500/1827 [00:06<00:17, 77.21it/s]
1718
  28%|██▊ | 508/1827 [00:06<00:16, 77.99it/s]
1719
  28%|██▊ | 517/1827 [00:06<00:16, 78.96it/s]
1720
  29%|██▉ | 526/1827 [00:06<00:16, 80.10it/s]
1721
  29%|██▉ | 535/1827 [00:06<00:16, 78.94it/s]
1722
  30%|██▉ | 544/1827 [00:06<00:16, 79.81it/s]
1723
  30%|███ | 552/1827 [00:06<00:16, 79.35it/s]
1724
  31%|███ | 560/1827 [00:07<00:15, 79.45it/s]
1725
  31%|███ | 569/1827 [00:07<00:15, 80.99it/s]
1726
  32%|███▏ | 578/1827 [00:07<00:15, 81.34it/s]
1727
  32%|███▏ | 587/1827 [00:07<00:15, 80.67it/s]
1728
  33%|███▎ | 596/1827 [00:07<00:15, 80.51it/s]
1729
  33%|███▎ | 605/1827 [00:07<00:15, 80.13it/s]
1730
  34%|███▎ | 614/1827 [00:07<00:15, 79.68it/s]
1731
  34%|███▍ | 623/1827 [00:07<00:15, 80.12it/s]
1732
  35%|███▍ | 632/1827 [00:07<00:14, 81.44it/s]
1733
  35%|███▌ | 641/1827 [00:08<00:14, 82.11it/s]
1734
  36%|███▌ | 650/1827 [00:08<00:15, 76.75it/s]
1735
  36%|███▌ | 658/1827 [00:08<00:15, 76.92it/s]
1736
  37%|███▋ | 667/1827 [00:08<00:14, 78.89it/s]
1737
  37%|███▋ | 675/1827 [00:08<00:14, 78.89it/s]
1738
  37%|███▋ | 684/1827 [00:08<00:14, 79.53it/s]
1739
  38%|███▊ | 693/1827 [00:08<00:14, 80.94it/s]
1740
  38%|███▊ | 702/1827 [00:08<00:14, 79.96it/s]
1741
  39%|███▉ | 711/1827 [00:08<00:13, 80.90it/s]
1742
  39%|███▉ | 720/1827 [00:09<00:13, 81.50it/s]
1743
  40%|███▉ | 729/1827 [00:09<00:13, 81.53it/s]
1744
  40%|████ | 738/1827 [00:09<00:13, 80.96it/s]
1745
  41%|████ | 747/1827 [00:09<00:13, 80.92it/s]
1746
  41%|████▏ | 756/1827 [00:09<00:13, 81.00it/s]
1747
  42%|████▏ | 765/1827 [00:09<00:13, 80.78it/s]
1748
  42%|████▏ | 774/1827 [00:09<00:13, 80.77it/s]
1749
  43%|████▎ | 783/1827 [00:09<00:13, 78.74it/s]
1750
  43%|████▎ | 792/1827 [00:09<00:13, 79.23it/s]
1751
  44%|████▍ | 800/1827 [00:10<00:13, 78.17it/s]
1752
  44%|████▍ | 809/1827 [00:10<00:12, 79.00it/s]
1753
  45%|████▍ | 818/1827 [00:10<00:12, 79.52it/s]
1754
  45%|████▌ | 827/1827 [00:10<00:12, 80.48it/s]
1755
  46%|████▌ | 836/1827 [00:10<00:12, 78.98it/s]
1756
  46%|████▋ | 845/1827 [00:10<00:12, 80.14it/s]
1757
  47%|████▋ | 854/1827 [00:10<00:12, 80.46it/s]
1758
  47%|████▋ | 863/1827 [00:10<00:11, 81.18it/s]
1759
  48%|████▊ | 872/1827 [00:10<00:11, 81.19it/s]
1760
  48%|████▊ | 881/1827 [00:11<00:11, 80.98it/s]
1761
  49%|████▊ | 890/1827 [00:11<00:11, 81.37it/s]
1762
  49%|████▉ | 899/1827 [00:11<00:11, 81.91it/s]
1763
  50%|████▉ | 908/1827 [00:11<00:11, 81.97it/s]
1764
  50%|█████ | 917/1827 [00:11<00:11, 82.23it/s]
1765
  51%|█████ | 926/1827 [00:11<00:10, 82.15it/s]
1766
  51%|█████ | 935/1827 [00:11<00:11, 80.10it/s]
1767
  52%|█████▏ | 944/1827 [00:11<00:10, 80.66it/s]
1768
  52%|█████▏ | 953/1827 [00:11<00:11, 79.31it/s]
1769
  53%|█████▎ | 962/1827 [00:12<00:10, 79.70it/s]
1770
  53%|█████▎ | 971/1827 [00:12<00:10, 80.87it/s]
1771
  54%|█████▎ | 980/1827 [00:12<00:10, 79.74it/s]
1772
  54%|█████▍ | 989/1827 [00:12<00:10, 80.80it/s]
1773
  55%|█████▍ | 998/1827 [00:12<00:10, 80.66it/s]
1774
  55%|█████▌ | 1007/1827 [00:12<00:10, 79.92it/s]
1775
  56%|█████▌ | 1015/1827 [00:12<00:10, 79.86it/s]
1776
  56%|█████▌ | 1024/1827 [00:12<00:09, 80.72it/s]
1777
  57%|█████▋ | 1033/1827 [00:12<00:09, 81.65it/s]
1778
  57%|█████▋ | 1042/1827 [00:13<00:09, 79.17it/s]
1779
  58%|█████▊ | 1051/1827 [00:13<00:09, 79.75it/s]
1780
  58%|█████▊ | 1060/1827 [00:13<00:09, 80.06it/s]
1781
  59%|█████▊ | 1069/1827 [00:13<00:09, 79.66it/s]
1782
  59%|█████▉ | 1078/1827 [00:13<00:09, 80.33it/s]
1783
  59%|█████▉ | 1087/1827 [00:13<00:09, 80.70it/s]
1784
  60%|█████▉ | 1096/1827 [00:13<00:09, 80.82it/s]
1785
  60%|██████ | 1105/1827 [00:13<00:09, 79.90it/s]
1786
  61%|██████ | 1113/1827 [00:13<00:08, 79.37it/s]
1787
  61%|██████▏ | 1121/1827 [00:14<00:08, 78.82it/s]
1788
  62%|██████▏ | 1129/1827 [00:14<00:08, 78.74it/s]
1789
  62%|██████▏ | 1138/1827 [00:14<00:08, 79.54it/s]
1790
  63%|██████▎ | 1146/1827 [00:14<00:08, 79.64it/s]
1791
  63%|██████▎ | 1154/1827 [00:14<00:08, 78.95it/s]
1792
  64%|██████▎ | 1162/1827 [00:14<00:08, 76.85it/s]
1793
  64%|██████▍ | 1170/1827 [00:14<00:08, 77.11it/s]
1794
  64%|██████▍ | 1178/1827 [00:14<00:08, 77.41it/s]
1795
  65%|██████▍ | 1186/1827 [00:14<00:08, 76.41it/s]
1796
  65%|██████▌ | 1195/1827 [00:15<00:08, 77.75it/s]
1797
  66%|██████▌ | 1203/1827 [00:15<00:07, 78.33it/s]
1798
  66%|██████▋ | 1211/1827 [00:15<00:07, 77.14it/s]
1799
  67%|██████▋ | 1219/1827 [00:15<00:08, 75.69it/s]
1800
  67%|██████▋ | 1227/1827 [00:15<00:07, 76.88it/s]
1801
  68%|██████▊ | 1235/1827 [00:15<00:07, 77.28it/s]
1802
  68%|██████▊ | 1243/1827 [00:15<00:07, 77.68it/s]
1803
  68%|██████▊ | 1251/1827 [00:15<00:07, 77.84it/s]
1804
  69%|██████▉ | 1259/1827 [00:15<00:07, 75.35it/s]
1805
  69%|██████▉ | 1267/1827 [00:15<00:07, 76.47it/s]
1806
  70%|██████▉ | 1276/1827 [00:16<00:07, 77.97it/s]
1807
  70%|███████ | 1284/1827 [00:16<00:06, 78.01it/s]
1808
  71%|███████ | 1292/1827 [00:16<00:06, 76.45it/s]
1809
  71%|███████ | 1300/1827 [00:16<00:06, 77.46it/s]
1810
  72%|███████▏ | 1308/1827 [00:16<00:06, 78.03it/s]
1811
  72%|███████▏ | 1316/1827 [00:16<00:06, 77.74it/s]
1812
  72%|███████▏ | 1324/1827 [00:16<00:06, 77.86it/s]
1813
  73%|███████▎ | 1332/1827 [00:16<00:06, 77.96it/s]
1814
  73%|███████▎ | 1340/1827 [00:16<00:06, 78.18it/s]
1815
  74%|███████▍ | 1348/1827 [00:17<00:06, 76.62it/s]
1816
  74%|███████▍ | 1356/1827 [00:17<00:06, 77.14it/s]
1817
  75%|███████▍ | 1364/1827 [00:17<00:05, 77.97it/s]
1818
  75%|███████▌ | 1372/1827 [00:17<00:05, 78.09it/s]
1819
  76%|███████▌ | 1381/1827 [00:17<00:05, 79.48it/s]
1820
  76%|███████▌ | 1389/1827 [00:17<00:05, 79.56it/s]
1821
  77%|███████▋ | 1398/1827 [00:17<00:05, 80.37it/s]
1822
  77%|███████▋ | 1407/1827 [00:17<00:05, 81.10it/s]
1823
  78%|███████▊ | 1416/1827 [00:17<00:05, 81.80it/s]
1824
  78%|███████▊ | 1425/1827 [00:17<00:04, 80.90it/s]
1825
  78%|███████▊ | 1434/1827 [00:18<00:04, 79.95it/s]
1826
  79%|███████▉ | 1442/1827 [00:18<00:04, 77.56it/s]
1827
  79%|███████▉ | 1450/1827 [00:18<00:04, 77.58it/s]
1828
  80%|███████▉ | 1459/1827 [00:18<00:04, 78.93it/s]
1829
  80%|████████ | 1468/1827 [00:18<00:04, 79.42it/s]
1830
  81%|████████ | 1476/1827 [00:18<00:04, 77.02it/s]
1831
  81%|████████ | 1484/1827 [00:18<00:04, 77.76it/s]
1832
  82%|████████▏ | 1492/1827 [00:18<00:04, 75.57it/s]
1833
  82%|████████▏ | 1500/1827 [00:18<00:04, 76.23it/s]
1834
  83%|████████▎ | 1508/1827 [00:19<00:04, 76.65it/s]
1835
  83%|████████▎ | 1517/1827 [00:19<00:03, 78.09it/s]
1836
  83%|████████▎ | 1525/1827 [00:19<00:03, 77.38it/s]
1837
  84%|████████▍ | 1534/1827 [00:19<00:03, 78.28it/s]
1838
  84%|████████▍ | 1542/1827 [00:19<00:03, 77.60it/s]
1839
  85%|████████▍ | 1550/1827 [00:19<00:03, 77.22it/s]
1840
  85%|████████▌ | 1558/1827 [00:19<00:03, 77.63it/s]
1841
  86%|████████▌ | 1566/1827 [00:19<00:03, 77.77it/s]
1842
  86%|████████▌ | 1574/1827 [00:19<00:03, 77.61it/s]
1843
  87%|████████▋ | 1583/1827 [00:20<00:03, 78.96it/s]
1844
  87%|████████▋ | 1591/1827 [00:20<00:02, 78.85it/s]
1845
  88%|████████▊ | 1599/1827 [00:20<00:02, 78.83it/s]
1846
  88%|████████▊ | 1608/1827 [00:20<00:02, 79.18it/s]
1847
  88%|████████▊ | 1616/1827 [00:20<00:02, 78.24it/s]
1848
  89%|████████▉ | 1624/1827 [00:20<00:02, 72.35it/s]
1849
  89%|████████▉ | 1632/1827 [00:20<00:02, 73.13it/s]
1850
  90%|████████▉ | 1640/1827 [00:20<00:02, 73.24it/s]
1851
  90%|█████████ | 1649/1827 [00:20<00:02, 75.71it/s]
1852
  91%|█████████ | 1658/1827 [00:21<00:02, 77.38it/s]
1853
  91%|█████████ | 1666/1827 [00:21<00:02, 77.89it/s]
1854
  92%|█████████▏| 1675/1827 [00:21<00:01, 79.27it/s]
1855
  92%|█████████▏| 1684/1827 [00:21<00:01, 80.75it/s]
1856
  93%|█████████▎| 1693/1827 [00:21<00:01, 79.27it/s]
1857
  93%|█████████▎| 1702/1827 [00:21<00:01, 79.89it/s]
1858
  94%|█████████▎| 1711/1827 [00:21<00:01, 80.41it/s]
1859
  94%|█████████▍| 1720/1827 [00:21<00:01, 77.30it/s]
1860
  95%|█████████▍| 1729/1827 [00:21<00:01, 78.18it/s]
1861
  95%|█████████▌| 1738/1827 [00:22<00:01, 79.15it/s]
1862
  96%|█████████▌| 1747/1827 [00:22<00:00, 80.30it/s]
1863
  96%|█████████▌| 1756/1827 [00:22<00:00, 79.63it/s]
1864
  97%|█████████▋| 1765/1827 [00:22<00:00, 80.54it/s]
1865
  97%|█████████▋| 1774/1827 [00:22<00:00, 80.33it/s]
1866
  98%|█████████▊| 1783/1827 [00:22<00:00, 81.23it/s]
1867
  98%|█████████▊| 1792/1827 [00:22<00:00, 80.70it/s]
1868
  99%|█████████▊| 1801/1827 [00:22<00:00, 77.42it/s]
1869
  99%|█████████▉| 1810/1827 [00:22<00:00, 78.66it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1553
  {'eval_loss': 1.4861844778060913, 'eval_precision': 0.0914341567442687, 'eval_recall': 0.9457720588235294, 'eval_f1': 0.16674769081186194, 'eval_accuracy': 0.7820794485561674, 'eval_runtime': 15.3988, 'eval_samples_per_second': 442.243, 'eval_steps_per_second': 55.329, 'epoch': 9.99}
1554
  {'train_runtime': 1208.2019, 'train_samples_per_second': 225.368, 'train_steps_per_second': 3.518, 'train_loss': 0.10639642311544979, 'epoch': 9.99}
1555
 
1556
+ ***** train metrics *****
1557
+ epoch = 9.9882
1558
+ total_flos = 11781054GF
1559
+ train_loss = 0.1064
1560
+ train_runtime = 0:20:08.20
1561
+ train_samples = 27229
1562
+ train_samples_per_second = 225.368
1563
+ train_steps_per_second = 3.518
1564
+ 08/30/2024 20:17:04 - INFO - __main__ - *** Evaluate ***
1565
+ [INFO|trainer.py:805] 2024-08-30 20:17:04,325 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: id, ner_tags, tokens. If id, ner_tags, tokens are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message.
1566
+ [INFO|trainer.py:3788] 2024-08-30 20:17:04,327 >>
1567
+ ***** Running Evaluation *****
1568
+ [INFO|trainer.py:3790] 2024-08-30 20:17:04,327 >> Num examples = 6810
1569
+ [INFO|trainer.py:3793] 2024-08-30 20:17:04,327 >> Batch size = 8
1570
+
1571
  0%| | 0/852 [00:00<?, ?it/s]
1572
  1%| | 10/852 [00:00<00:09, 90.08it/s]
1573
  2%|▏ | 20/852 [00:00<00:10, 78.76it/s]
1574
  3%|▎ | 28/852 [00:00<00:10, 78.02it/s]
1575
  4%|▍ | 36/852 [00:00<00:10, 78.47it/s]
1576
  5%|▌ | 44/852 [00:00<00:10, 78.61it/s]
1577
  6%|▌ | 53/852 [00:00<00:10, 79.34it/s]
1578
  7%|▋ | 62/852 [00:00<00:09, 79.85it/s]
1579
  8%|▊ | 70/852 [00:00<00:10, 77.38it/s]
1580
  9%|▉ | 78/852 [00:00<00:09, 78.05it/s]
1581
  10%|█ | 86/852 [00:01<00:09, 77.50it/s]
1582
  11%|█ | 94/852 [00:01<00:09, 76.16it/s]
1583
  12%|█▏ | 103/852 [00:01<00:09, 77.40it/s]
1584
  13%|█▎ | 111/852 [00:01<00:09, 77.04it/s]
1585
  14%|█▍ | 119/852 [00:01<00:09, 77.45it/s]
1586
  15%|█▍ | 127/852 [00:01<00:09, 74.43it/s]
1587
  16%|█▌ | 135/852 [00:01<00:09, 75.89it/s]
1588
  17%|█▋ | 143/852 [00:01<00:09, 76.32it/s]
1589
  18%|█▊ | 151/852 [00:01<00:09, 75.91it/s]
1590
  19%|█▉ | 160/852 [00:02<00:08, 78.09it/s]
1591
  20%|█▉ | 168/852 [00:02<00:08, 78.48it/s]
1592
  21%|██ | 176/852 [00:02<00:08, 78.21it/s]
1593
  22%|██▏ | 184/852 [00:02<00:08, 78.18it/s]
1594
  23%|██▎ | 192/852 [00:02<00:08, 78.36it/s]
1595
  24%|██▎ | 201/852 [00:02<00:08, 79.00it/s]
1596
  25%|██▍ | 209/852 [00:02<00:08, 76.98it/s]
1597
  25%|██▌ | 217/852 [00:02<00:08, 77.31it/s]
1598
  26%|██▋ | 225/852 [00:02<00:08, 77.91it/s]
1599
  27%|██▋ | 234/852 [00:03<00:07, 78.41it/s]
1600
  28%|██▊ | 242/852 [00:03<00:08, 75.26it/s]
1601
  29%|██▉ | 250/852 [00:03<00:07, 76.11it/s]
1602
  30%|███ | 258/852 [00:03<00:07, 76.87it/s]
1603
  31%|███ | 266/852 [00:03<00:07, 77.23it/s]
1604
  32%|███▏ | 274/852 [00:03<00:07, 76.72it/s]
1605
  33%|███▎ | 283/852 [00:03<00:07, 77.64it/s]
1606
  34%|███▍ | 291/852 [00:03<00:07, 77.42it/s]
1607
  35%|███▌ | 300/852 [00:03<00:07, 78.54it/s]
1608
  36%|███▋ | 309/852 [00:03<00:06, 79.83it/s]
1609
  37%|███▋ | 317/852 [00:04<00:06, 77.81it/s]
1610
  38%|███▊ | 325/852 [00:04<00:06, 77.95it/s]
1611
  39%|███▉ | 333/852 [00:04<00:06, 77.82it/s]
1612
  40%|████ | 341/852 [00:04<00:06, 78.04it/s]
1613
  41%|████ | 349/852 [00:04<00:06, 77.95it/s]
1614
  42%|████▏ | 357/852 [00:04<00:06, 75.79it/s]
1615
  43%|████▎ | 366/852 [00:04<00:06, 76.55it/s]
1616
  44%|████▍ | 375/852 [00:04<00:06, 77.81it/s]
1617
  45%|████▍ | 383/852 [00:04<00:06, 76.63it/s]
1618
  46%|████▌ | 391/852 [00:05<00:05, 77.37it/s]
1619
  47%|████▋ | 399/852 [00:05<00:05, 77.36it/s]
1620
  48%|████▊ | 407/852 [00:05<00:05, 74.94it/s]
1621
  49%|████▊ | 415/852 [00:05<00:05, 75.29it/s]
1622
  50%|████▉ | 423/852 [00:05<00:05, 75.49it/s]
1623
  51%|█████ | 431/852 [00:05<00:05, 75.09it/s]
1624
  52%|█████▏ | 440/852 [00:05<00:05, 76.74it/s]
1625
  53%|█████▎ | 448/852 [00:05<00:05, 76.92it/s]
1626
  54%|█████▎ | 456/852 [00:05<00:05, 77.77it/s]
1627
  54%|█████▍ | 464/852 [00:05<00:05, 76.63it/s]
1628
  55%|█████▌ | 472/852 [00:06<00:05, 72.05it/s]
1629
  56%|█████▋ | 480/852 [00:06<00:05, 73.97it/s]
1630
  57%|█████▋ | 488/852 [00:06<00:04, 74.06it/s]
1631
  58%|█████▊ | 496/852 [00:06<00:04, 75.08it/s]
1632
  59%|█████▉ | 504/852 [00:06<00:04, 76.00it/s]
1633
  60%|██████ | 512/852 [00:06<00:04, 76.30it/s]
1634
  61%|██████ | 520/852 [00:06<00:04, 76.76it/s]
1635
  62%|██████▏ | 528/852 [00:06<00:04, 74.32it/s]
1636
  63%|██████▎ | 536/852 [00:06<00:04, 75.58it/s]
1637
  64%|██████▍ | 544/852 [00:07<00:04, 76.71it/s]
1638
  65%|██████▍ | 552/852 [00:07<00:04, 74.95it/s]
1639
  66%|██████▌ | 560/852 [00:07<00:03, 75.87it/s]
1640
  67%|██████▋ | 568/852 [00:07<00:03, 76.63it/s]
1641
  68%|██████▊ | 576/852 [00:07<00:03, 76.40it/s]
1642
  69%|██████▊ | 584/852 [00:07<00:03, 75.28it/s]
1643
  69%|██████▉ | 592/852 [00:07<00:03, 75.66it/s]
1644
  70%|███████ | 600/852 [00:07<00:03, 75.20it/s]
1645
  71%|███████▏ | 608/852 [00:07<00:03, 74.78it/s]
1646
  72%|███████▏ | 616/852 [00:08<00:03, 73.06it/s]
1647
  73%|███████▎ | 624/852 [00:08<00:03, 74.76it/s]
1648
  74%|███████▍ | 632/852 [00:08<00:03, 73.28it/s]
1649
  75%|███████▌ | 640/852 [00:08<00:02, 73.23it/s]
1650
  76%|███████▌ | 648/852 [00:08<00:02, 72.28it/s]
1651
  77%|███████▋ | 656/852 [00:08<00:02, 74.30it/s]
1652
  78%|███████▊ | 664/852 [00:08<00:02, 74.53it/s]
1653
  79%|███████▉ | 672/852 [00:08<00:02, 74.57it/s]
1654
  80%|███████▉ | 680/852 [00:08<00:02, 75.61it/s]
1655
  81%|████████ | 689/852 [00:08<00:02, 77.74it/s]
1656
  82%|████████▏ | 697/852 [00:09<00:02, 76.57it/s]
1657
  83%|████████▎ | 706/852 [00:09<00:01, 77.79it/s]
1658
  84%|████████▍ | 714/852 [00:09<00:01, 78.22it/s]
1659
  85%|████████▍ | 722/852 [00:09<00:01, 77.26it/s]
1660
  86%|████████▌ | 731/852 [00:09<00:01, 78.66it/s]
1661
  87%|████████▋ | 740/852 [00:09<00:01, 79.91it/s]
1662
  88%|████████▊ | 749/852 [00:09<00:01, 80.22it/s]
1663
  89%|████████▉ | 758/852 [00:09<00:01, 80.35it/s]
1664
  90%|█████████ | 767/852 [00:09<00:01, 79.25it/s]
1665
  91%|█████████ | 776/852 [00:10<00:00, 79.74it/s]
1666
  92%|█████████▏| 784/852 [00:10<00:00, 79.50it/s]
1667
  93%|█████████▎| 792/852 [00:10<00:00, 79.31it/s]
1668
  94%|█████████▍| 800/852 [00:10<00:00, 79.49it/s]
1669
  95%|█████████▍| 809/852 [00:10<00:00, 81.08it/s]
1670
  96%|█████████▌| 818/852 [00:10<00:00, 79.55it/s]
1671
  97%|█████████▋| 827/852 [00:10<00:00, 81.06it/s]
1672
  98%|█████████▊| 836/852 [00:10<00:00, 81.02it/s]
1673
  99%|█████████▉| 845/852 [00:10<00:00, 79.78it/s]/usr/local/lib/python3.10/dist-packages/seqeval/metrics/v1.py:57: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples. Use `zero_division` parameter to control this behavior.
1674
+ _warn_prf(average, modifier, msg_start, len(result))
1675
+
1676
+ ***** eval metrics *****
1677
+ epoch = 9.9882
1678
+ eval_accuracy = 0.7933
1679
+ eval_f1 = 0.1733
1680
+ eval_loss = 1.0503
1681
+ eval_precision = 0.0953
1682
+ eval_recall = 0.954
1683
+ eval_runtime = 0:00:14.68
1684
+ eval_samples = 6810
1685
+ eval_samples_per_second = 463.735
1686
+ eval_steps_per_second = 58.018
1687
+ 08/30/2024 20:17:19 - INFO - __main__ - *** Predict ***
1688
+ [INFO|trainer.py:805] 2024-08-30 20:17:19,020 >> The following columns in the test set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: id, ner_tags, tokens. If id, ner_tags, tokens are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message.
1689
+ [INFO|trainer.py:3788] 2024-08-30 20:17:19,022 >>
1690
+ ***** Running Prediction *****
1691
+ [INFO|trainer.py:3790] 2024-08-30 20:17:19,022 >> Num examples = 14614
1692
+ [INFO|trainer.py:3793] 2024-08-30 20:17:19,023 >> Batch size = 8
1693
+
1694
  0%| | 0/1827 [00:00<?, ?it/s]
1695
  1%| | 10/1827 [00:00<00:20, 87.94it/s]
1696
  1%| | 19/1827 [00:00<00:22, 79.79it/s]
1697
  1%|▏ | 27/1827 [00:00<00:22, 79.33it/s]
1698
  2%|▏ | 35/1827 [00:00<00:22, 78.11it/s]
1699
  2%|▏ | 44/1827 [00:00<00:22, 80.08it/s]
1700
  3%|▎ | 53/1827 [00:00<00:22, 79.80it/s]
1701
  3%|▎ | 61/1827 [00:00<00:22, 77.38it/s]
1702
  4%|▍ | 70/1827 [00:00<00:22, 77.96it/s]
1703
  4%|▍ | 79/1827 [00:00<00:21, 80.62it/s]
1704
  5%|▍ | 88/1827 [00:01<00:21, 79.62it/s]
1705
  5%|▌ | 97/1827 [00:01<00:21, 81.19it/s]
1706
  6%|▌ | 106/1827 [00:01<00:20, 82.65it/s]
1707
  6%|▋ | 115/1827 [00:01<00:20, 82.97it/s]
1708
  7%|▋ | 124/1827 [00:01<00:21, 79.65it/s]
1709
  7%|▋ | 133/1827 [00:01<00:21, 79.51it/s]
1710
  8%|▊ | 142/1827 [00:01<00:20, 80.61it/s]
1711
  8%|▊ | 151/1827 [00:01<00:20, 81.06it/s]
1712
  9%|▉ | 160/1827 [00:02<00:21, 77.41it/s]
1713
  9%|▉ | 169/1827 [00:02<00:21, 78.59it/s]
1714
  10%|▉ | 178/1827 [00:02<00:20, 79.54it/s]
1715
  10%|█ | 187/1827 [00:02<00:20, 80.64it/s]
1716
  11%|█ | 196/1827 [00:02<00:20, 80.28it/s]
1717
  11%|█ | 205/1827 [00:02<00:20, 79.31it/s]
1718
  12%|█▏ | 213/1827 [00:02<00:20, 78.96it/s]
1719
  12%|█▏ | 222/1827 [00:02<00:20, 79.52it/s]
1720
  13%|█▎ | 230/1827 [00:02<00:20, 78.22it/s]
1721
  13%|█▎ | 238/1827 [00:02<00:20, 76.49it/s]
1722
  14%|█▎ | 247/1827 [00:03<00:20, 78.15it/s]
1723
  14%|█▍ | 256/1827 [00:03<00:19, 79.26it/s]
1724
  14%|█▍ | 264/1827 [00:03<00:20, 77.90it/s]
1725
  15%|█▍ | 273/1827 [00:03<00:19, 80.06it/s]
1726
  15%|█▌ | 282/1827 [00:03<00:19, 81.15it/s]
1727
  16%|█▌ | 291/1827 [00:03<00:19, 80.73it/s]
1728
  16%|█▋ | 300/1827 [00:03<00:18, 81.69it/s]
1729
  17%|█▋ | 309/1827 [00:03<00:18, 80.77it/s]
1730
  17%|█▋ | 318/1827 [00:03<00:18, 80.07it/s]
1731
  18%|█▊ | 327/1827 [00:04<00:18, 81.60it/s]
1732
  18%|█▊ | 336/1827 [00:04<00:18, 80.47it/s]
1733
  19%|█▉ | 345/1827 [00:04<00:18, 81.57it/s]
1734
  19%|█▉ | 354/1827 [00:04<00:19, 76.57it/s]
1735
  20%|█▉ | 362/1827 [00:04<00:19, 76.83it/s]
1736
  20%|██ | 370/1827 [00:04<00:18, 77.31it/s]
1737
  21%|██ | 378/1827 [00:04<00:18, 77.60it/s]
1738
  21%|██ | 386/1827 [00:04<00:18, 77.53it/s]
1739
  22%|██▏ | 394/1827 [00:04<00:18, 77.31it/s]
1740
  22%|██▏ | 402/1827 [00:05<00:18, 77.04it/s]
1741
  22%|██▏ | 410/1827 [00:05<00:18, 77.21it/s]
1742
  23%|██▎ | 418/1827 [00:05<00:18, 74.60it/s]
1743
  23%|██▎ | 426/1827 [00:05<00:18, 75.34it/s]
1744
  24%|██▍ | 434/1827 [00:05<00:18, 75.76it/s]
1745
  24%|██▍ | 442/1827 [00:05<00:18, 75.30it/s]
1746
  25%|██▍ | 450/1827 [00:05<00:18, 76.15it/s]
1747
  25%|██▌ | 459/1827 [00:05<00:17, 77.96it/s]
1748
  26%|██▌ | 468/1827 [00:05<00:17, 78.69it/s]
1749
  26%|██▌ | 476/1827 [00:06<00:17, 77.24it/s]
1750
  26%|██▋ | 484/1827 [00:06<00:17, 77.34it/s]
1751
  27%|██▋ | 492/1827 [00:06<00:17, 76.12it/s]
1752
  27%|██▋ | 500/1827 [00:06<00:17, 77.21it/s]
1753
  28%|██▊ | 508/1827 [00:06<00:16, 77.99it/s]
1754
  28%|██▊ | 517/1827 [00:06<00:16, 78.96it/s]
1755
  29%|██▉ | 526/1827 [00:06<00:16, 80.10it/s]
1756
  29%|██▉ | 535/1827 [00:06<00:16, 78.94it/s]
1757
  30%|██▉ | 544/1827 [00:06<00:16, 79.81it/s]
1758
  30%|███ | 552/1827 [00:06<00:16, 79.35it/s]
1759
  31%|███ | 560/1827 [00:07<00:15, 79.45it/s]
1760
  31%|███ | 569/1827 [00:07<00:15, 80.99it/s]
1761
  32%|███▏ | 578/1827 [00:07<00:15, 81.34it/s]
1762
  32%|███▏ | 587/1827 [00:07<00:15, 80.67it/s]
1763
  33%|███▎ | 596/1827 [00:07<00:15, 80.51it/s]
1764
  33%|███▎ | 605/1827 [00:07<00:15, 80.13it/s]
1765
  34%|███▎ | 614/1827 [00:07<00:15, 79.68it/s]
1766
  34%|███▍ | 623/1827 [00:07<00:15, 80.12it/s]
1767
  35%|███▍ | 632/1827 [00:07<00:14, 81.44it/s]
1768
  35%|███▌ | 641/1827 [00:08<00:14, 82.11it/s]
1769
  36%|███▌ | 650/1827 [00:08<00:15, 76.75it/s]
1770
  36%|███▌ | 658/1827 [00:08<00:15, 76.92it/s]
1771
  37%|███▋ | 667/1827 [00:08<00:14, 78.89it/s]
1772
  37%|███▋ | 675/1827 [00:08<00:14, 78.89it/s]
1773
  37%|███▋ | 684/1827 [00:08<00:14, 79.53it/s]
1774
  38%|███▊ | 693/1827 [00:08<00:14, 80.94it/s]
1775
  38%|███▊ | 702/1827 [00:08<00:14, 79.96it/s]
1776
  39%|███▉ | 711/1827 [00:08<00:13, 80.90it/s]
1777
  39%|███▉ | 720/1827 [00:09<00:13, 81.50it/s]
1778
  40%|███▉ | 729/1827 [00:09<00:13, 81.53it/s]
1779
  40%|████ | 738/1827 [00:09<00:13, 80.96it/s]
1780
  41%|████ | 747/1827 [00:09<00:13, 80.92it/s]
1781
  41%|████▏ | 756/1827 [00:09<00:13, 81.00it/s]
1782
  42%|████▏ | 765/1827 [00:09<00:13, 80.78it/s]
1783
  42%|████▏ | 774/1827 [00:09<00:13, 80.77it/s]
1784
  43%|████▎ | 783/1827 [00:09<00:13, 78.74it/s]
1785
  43%|████▎ | 792/1827 [00:09<00:13, 79.23it/s]
1786
  44%|████▍ | 800/1827 [00:10<00:13, 78.17it/s]
1787
  44%|████▍ | 809/1827 [00:10<00:12, 79.00it/s]
1788
  45%|████▍ | 818/1827 [00:10<00:12, 79.52it/s]
1789
  45%|████▌ | 827/1827 [00:10<00:12, 80.48it/s]
1790
  46%|████▌ | 836/1827 [00:10<00:12, 78.98it/s]
1791
  46%|████▋ | 845/1827 [00:10<00:12, 80.14it/s]
1792
  47%|████▋ | 854/1827 [00:10<00:12, 80.46it/s]
1793
  47%|████▋ | 863/1827 [00:10<00:11, 81.18it/s]
1794
  48%|████▊ | 872/1827 [00:10<00:11, 81.19it/s]
1795
  48%|████▊ | 881/1827 [00:11<00:11, 80.98it/s]
1796
  49%|████▊ | 890/1827 [00:11<00:11, 81.37it/s]
1797
  49%|████▉ | 899/1827 [00:11<00:11, 81.91it/s]
1798
  50%|████▉ | 908/1827 [00:11<00:11, 81.97it/s]
1799
  50%|█████ | 917/1827 [00:11<00:11, 82.23it/s]
1800
  51%|█████ | 926/1827 [00:11<00:10, 82.15it/s]
1801
  51%|█████ | 935/1827 [00:11<00:11, 80.10it/s]
1802
  52%|█████▏ | 944/1827 [00:11<00:10, 80.66it/s]
1803
  52%|█████▏ | 953/1827 [00:11<00:11, 79.31it/s]
1804
  53%|█████▎ | 962/1827 [00:12<00:10, 79.70it/s]
1805
  53%|█████▎ | 971/1827 [00:12<00:10, 80.87it/s]
1806
  54%|█████▎ | 980/1827 [00:12<00:10, 79.74it/s]
1807
  54%|█████▍ | 989/1827 [00:12<00:10, 80.80it/s]
1808
  55%|█████▍ | 998/1827 [00:12<00:10, 80.66it/s]
1809
  55%|█████▌ | 1007/1827 [00:12<00:10, 79.92it/s]
1810
  56%|█████▌ | 1015/1827 [00:12<00:10, 79.86it/s]
1811
  56%|█████▌ | 1024/1827 [00:12<00:09, 80.72it/s]
1812
  57%|█████▋ | 1033/1827 [00:12<00:09, 81.65it/s]
1813
  57%|█████▋ | 1042/1827 [00:13<00:09, 79.17it/s]
1814
  58%|█████▊ | 1051/1827 [00:13<00:09, 79.75it/s]
1815
  58%|█████▊ | 1060/1827 [00:13<00:09, 80.06it/s]
1816
  59%|█████▊ | 1069/1827 [00:13<00:09, 79.66it/s]
1817
  59%|█████▉ | 1078/1827 [00:13<00:09, 80.33it/s]
1818
  59%|█████▉ | 1087/1827 [00:13<00:09, 80.70it/s]
1819
  60%|█████▉ | 1096/1827 [00:13<00:09, 80.82it/s]
1820
  60%|██████ | 1105/1827 [00:13<00:09, 79.90it/s]
1821
  61%|██████ | 1113/1827 [00:13<00:08, 79.37it/s]
1822
  61%|██████▏ | 1121/1827 [00:14<00:08, 78.82it/s]
1823
  62%|██████▏ | 1129/1827 [00:14<00:08, 78.74it/s]
1824
  62%|██████▏ | 1138/1827 [00:14<00:08, 79.54it/s]
1825
  63%|██████▎ | 1146/1827 [00:14<00:08, 79.64it/s]
1826
  63%|██████▎ | 1154/1827 [00:14<00:08, 78.95it/s]
1827
  64%|██████▎ | 1162/1827 [00:14<00:08, 76.85it/s]
1828
  64%|██████▍ | 1170/1827 [00:14<00:08, 77.11it/s]
1829
  64%|██████▍ | 1178/1827 [00:14<00:08, 77.41it/s]
1830
  65%|██████▍ | 1186/1827 [00:14<00:08, 76.41it/s]
1831
  65%|██████▌ | 1195/1827 [00:15<00:08, 77.75it/s]
1832
  66%|██████▌ | 1203/1827 [00:15<00:07, 78.33it/s]
1833
  66%|██████▋ | 1211/1827 [00:15<00:07, 77.14it/s]
1834
  67%|██████▋ | 1219/1827 [00:15<00:08, 75.69it/s]
1835
  67%|██████▋ | 1227/1827 [00:15<00:07, 76.88it/s]
1836
  68%|██████▊ | 1235/1827 [00:15<00:07, 77.28it/s]
1837
  68%|██████▊ | 1243/1827 [00:15<00:07, 77.68it/s]
1838
  68%|██████▊ | 1251/1827 [00:15<00:07, 77.84it/s]
1839
  69%|██████▉ | 1259/1827 [00:15<00:07, 75.35it/s]
1840
  69%|██████▉ | 1267/1827 [00:15<00:07, 76.47it/s]
1841
  70%|██████▉ | 1276/1827 [00:16<00:07, 77.97it/s]
1842
  70%|███████ | 1284/1827 [00:16<00:06, 78.01it/s]
1843
  71%|███████ | 1292/1827 [00:16<00:06, 76.45it/s]
1844
  71%|███████ | 1300/1827 [00:16<00:06, 77.46it/s]
1845
  72%|███████▏ | 1308/1827 [00:16<00:06, 78.03it/s]
1846
  72%|███████▏ | 1316/1827 [00:16<00:06, 77.74it/s]
1847
  72%|███████▏ | 1324/1827 [00:16<00:06, 77.86it/s]
1848
  73%|███████▎ | 1332/1827 [00:16<00:06, 77.96it/s]
1849
  73%|███████▎ | 1340/1827 [00:16<00:06, 78.18it/s]
1850
  74%|███████▍ | 1348/1827 [00:17<00:06, 76.62it/s]
1851
  74%|███████▍ | 1356/1827 [00:17<00:06, 77.14it/s]
1852
  75%|███████▍ | 1364/1827 [00:17<00:05, 77.97it/s]
1853
  75%|███████▌ | 1372/1827 [00:17<00:05, 78.09it/s]
1854
  76%|███████▌ | 1381/1827 [00:17<00:05, 79.48it/s]
1855
  76%|███████▌ | 1389/1827 [00:17<00:05, 79.56it/s]
1856
  77%|███████▋ | 1398/1827 [00:17<00:05, 80.37it/s]
1857
  77%|███████▋ | 1407/1827 [00:17<00:05, 81.10it/s]
1858
  78%|███████▊ | 1416/1827 [00:17<00:05, 81.80it/s]
1859
  78%|███████▊ | 1425/1827 [00:17<00:04, 80.90it/s]
1860
  78%|███████▊ | 1434/1827 [00:18<00:04, 79.95it/s]
1861
  79%|███████▉ | 1442/1827 [00:18<00:04, 77.56it/s]
1862
  79%|███████▉ | 1450/1827 [00:18<00:04, 77.58it/s]
1863
  80%|███████▉ | 1459/1827 [00:18<00:04, 78.93it/s]
1864
  80%|████████ | 1468/1827 [00:18<00:04, 79.42it/s]
1865
  81%|████████ | 1476/1827 [00:18<00:04, 77.02it/s]
1866
  81%|████████ | 1484/1827 [00:18<00:04, 77.76it/s]
1867
  82%|████████▏ | 1492/1827 [00:18<00:04, 75.57it/s]
1868
  82%|████████▏ | 1500/1827 [00:18<00:04, 76.23it/s]
1869
  83%|████████▎ | 1508/1827 [00:19<00:04, 76.65it/s]
1870
  83%|████████▎ | 1517/1827 [00:19<00:03, 78.09it/s]
1871
  83%|████████▎ | 1525/1827 [00:19<00:03, 77.38it/s]
1872
  84%|████████▍ | 1534/1827 [00:19<00:03, 78.28it/s]
1873
  84%|████████▍ | 1542/1827 [00:19<00:03, 77.60it/s]
1874
  85%|████████▍ | 1550/1827 [00:19<00:03, 77.22it/s]
1875
  85%|████████▌ | 1558/1827 [00:19<00:03, 77.63it/s]
1876
  86%|████████▌ | 1566/1827 [00:19<00:03, 77.77it/s]
1877
  86%|████████▌ | 1574/1827 [00:19<00:03, 77.61it/s]
1878
  87%|████████▋ | 1583/1827 [00:20<00:03, 78.96it/s]
1879
  87%|████████▋ | 1591/1827 [00:20<00:02, 78.85it/s]
1880
  88%|████████▊ | 1599/1827 [00:20<00:02, 78.83it/s]
1881
  88%|████████▊ | 1608/1827 [00:20<00:02, 79.18it/s]
1882
  88%|████████▊ | 1616/1827 [00:20<00:02, 78.24it/s]
1883
  89%|████████▉ | 1624/1827 [00:20<00:02, 72.35it/s]
1884
  89%|████████▉ | 1632/1827 [00:20<00:02, 73.13it/s]
1885
  90%|████████▉ | 1640/1827 [00:20<00:02, 73.24it/s]
1886
  90%|█████████ | 1649/1827 [00:20<00:02, 75.71it/s]
1887
  91%|█████████ | 1658/1827 [00:21<00:02, 77.38it/s]
1888
  91%|█████████ | 1666/1827 [00:21<00:02, 77.89it/s]
1889
  92%|█████████▏| 1675/1827 [00:21<00:01, 79.27it/s]
1890
  92%|█████████▏| 1684/1827 [00:21<00:01, 80.75it/s]
1891
  93%|█████████▎| 1693/1827 [00:21<00:01, 79.27it/s]
1892
  93%|█████████▎| 1702/1827 [00:21<00:01, 79.89it/s]
1893
  94%|█████████▎| 1711/1827 [00:21<00:01, 80.41it/s]
1894
  94%|█████████▍| 1720/1827 [00:21<00:01, 77.30it/s]
1895
  95%|█████████▍| 1729/1827 [00:21<00:01, 78.18it/s]
1896
  95%|█████████▌| 1738/1827 [00:22<00:01, 79.15it/s]
1897
  96%|█████████▌| 1747/1827 [00:22<00:00, 80.30it/s]
1898
  96%|█████████▌| 1756/1827 [00:22<00:00, 79.63it/s]
1899
  97%|█████████▋| 1765/1827 [00:22<00:00, 80.54it/s]
1900
  97%|█████████▋| 1774/1827 [00:22<00:00, 80.33it/s]
1901
  98%|█████████▊| 1783/1827 [00:22<00:00, 81.23it/s]
1902
  98%|█████████▊| 1792/1827 [00:22<00:00, 80.70it/s]
1903
  99%|█████████▊| 1801/1827 [00:22<00:00, 77.42it/s]
1904
  99%|█████████▉| 1810/1827 [00:22<00:00, 78.66it/s]
1905
+ [INFO|trainer.py:3478] 2024-08-30 20:17:49,537 >> Saving model checkpoint to /content/dissertation/scripts/ner/output
1906
+ [INFO|configuration_utils.py:472] 2024-08-30 20:17:49,539 >> Configuration saved in /content/dissertation/scripts/ner/output/config.json
1907
+ [INFO|modeling_utils.py:2690] 2024-08-30 20:17:50,922 >> Model weights saved in /content/dissertation/scripts/ner/output/model.safetensors
1908
+ [INFO|tokenization_utils_base.py:2574] 2024-08-30 20:17:50,923 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json
1909
+ [INFO|tokenization_utils_base.py:2583] 2024-08-30 20:17:50,923 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json
1910
+ ***** predict metrics *****
1911
+ predict_accuracy = 0.8809
1912
+ predict_f1 = 0.2408
1913
+ predict_loss = 0.6289
1914
+ predict_precision = 0.1378
1915
+ predict_recall = 0.9528
1916
+ predict_runtime = 0:00:29.87
1917
+ predict_samples_per_second = 489.229
1918
+ predict_steps_per_second = 61.162
1919
+
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 9.988249118683902,
3
  "total_flos": 1.2649810588547778e+16,
4
  "train_loss": 0.10639642311544979,
5
- "train_runtime": 1205.6346,
6
  "train_samples": 27229,
7
- "train_samples_per_second": 225.848,
8
- "train_steps_per_second": 3.525
9
  }
 
2
  "epoch": 9.988249118683902,
3
  "total_flos": 1.2649810588547778e+16,
4
  "train_loss": 0.10639642311544979,
5
+ "train_runtime": 1208.2019,
6
  "train_samples": 27229,
7
+ "train_samples_per_second": 225.368,
8
+ "train_steps_per_second": 3.518
9
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.4624414693662204,
3
  "best_model_checkpoint": "/content/dissertation/scripts/ner/output/checkpoint-2127",
4
  "epoch": 9.988249118683902,
5
  "eval_steps": 500,
@@ -10,14 +10,14 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9988249118683902,
13
- "eval_accuracy": 0.8517239485355707,
14
- "eval_f1": 0.4251637936518033,
15
- "eval_loss": 0.3833567500114441,
16
- "eval_precision": 0.29195422381409974,
17
- "eval_recall": 0.7819372952737482,
18
- "eval_runtime": 14.7317,
19
- "eval_samples_per_second": 462.27,
20
- "eval_steps_per_second": 57.835,
21
  "step": 425
22
  },
23
  {
@@ -29,14 +29,14 @@
29
  },
30
  {
31
  "epoch": 2.0,
32
- "eval_accuracy": 0.822140140332569,
33
- "eval_f1": 0.40249737425603915,
34
- "eval_loss": 0.5730458498001099,
35
- "eval_precision": 0.2681125621890547,
36
- "eval_recall": 0.8069723912026205,
37
- "eval_runtime": 14.9036,
38
- "eval_samples_per_second": 456.937,
39
- "eval_steps_per_second": 57.167,
40
  "step": 851
41
  },
42
  {
@@ -48,14 +48,14 @@
48
  },
49
  {
50
  "epoch": 2.99882491186839,
51
- "eval_accuracy": 0.8338185013799827,
52
- "eval_f1": 0.42018044559013074,
53
- "eval_loss": 0.5796028971672058,
54
- "eval_precision": 0.2847990681421083,
55
- "eval_recall": 0.8008890968647637,
56
- "eval_runtime": 14.7541,
57
- "eval_samples_per_second": 461.567,
58
- "eval_steps_per_second": 57.747,
59
  "step": 1276
60
  },
61
  {
@@ -67,14 +67,14 @@
67
  },
68
  {
69
  "epoch": 4.0,
70
- "eval_accuracy": 0.8388097820863142,
71
- "eval_f1": 0.43759863644971914,
72
- "eval_loss": 0.6590859889984131,
73
- "eval_precision": 0.2996455433560993,
74
- "eval_recall": 0.8109499298081423,
75
- "eval_runtime": 14.8634,
76
- "eval_samples_per_second": 458.172,
77
- "eval_steps_per_second": 57.322,
78
  "step": 1702
79
  },
80
  {
@@ -86,14 +86,14 @@
86
  },
87
  {
88
  "epoch": 4.9988249118683905,
89
- "eval_accuracy": 0.8601754843670617,
90
- "eval_f1": 0.4624414693662204,
91
- "eval_loss": 0.6266195774078369,
92
- "eval_precision": 0.32197630636422075,
93
- "eval_recall": 0.8203088441740758,
94
- "eval_runtime": 14.7766,
95
- "eval_samples_per_second": 460.863,
96
- "eval_steps_per_second": 57.659,
97
  "step": 2127
98
  },
99
  {
@@ -105,26 +105,26 @@
105
  },
106
  {
107
  "epoch": 6.0,
108
- "eval_accuracy": 0.8475977316105291,
109
- "eval_f1": 0.44600244420145363,
110
- "eval_loss": 0.7858611941337585,
111
- "eval_precision": 0.3075490109110263,
112
- "eval_recall": 0.8111839026672906,
113
- "eval_runtime": 14.8163,
114
- "eval_samples_per_second": 459.628,
115
- "eval_steps_per_second": 57.504,
116
  "step": 2553
117
  },
118
  {
119
  "epoch": 6.9988249118683905,
120
- "eval_accuracy": 0.8507970944841886,
121
- "eval_f1": 0.45324675324675323,
122
- "eval_loss": 0.829707145690918,
123
- "eval_precision": 0.3136796692432141,
124
- "eval_recall": 0.8165652784277024,
125
- "eval_runtime": 14.8867,
126
- "eval_samples_per_second": 457.456,
127
- "eval_steps_per_second": 57.232,
128
  "step": 2978
129
  },
130
  {
@@ -136,14 +136,14 @@
136
  },
137
  {
138
  "epoch": 8.0,
139
- "eval_accuracy": 0.8532206461889135,
140
- "eval_f1": 0.453628249902988,
141
- "eval_loss": 0.8468152284622192,
142
- "eval_precision": 0.3134608509116911,
143
- "eval_recall": 0.8205428170332242,
144
- "eval_runtime": 15.05,
145
- "eval_samples_per_second": 452.493,
146
- "eval_steps_per_second": 56.611,
147
  "step": 3404
148
  },
149
  {
@@ -155,14 +155,14 @@
155
  },
156
  {
157
  "epoch": 8.99882491186839,
158
- "eval_accuracy": 0.8493827838576352,
159
- "eval_f1": 0.44807482862451153,
160
- "eval_loss": 0.9241161346435547,
161
- "eval_precision": 0.30851345390383766,
162
- "eval_recall": 0.8182030884417407,
163
- "eval_runtime": 14.662,
164
- "eval_samples_per_second": 464.465,
165
- "eval_steps_per_second": 58.109,
166
  "step": 3829
167
  },
168
  {
@@ -174,14 +174,14 @@
174
  },
175
  {
176
  "epoch": 9.988249118683902,
177
- "eval_accuracy": 0.8498565092616749,
178
- "eval_f1": 0.44938176197836166,
179
- "eval_loss": 0.938378632068634,
180
- "eval_precision": 0.31002310289674784,
181
- "eval_recall": 0.816331305568554,
182
- "eval_runtime": 15.4697,
183
- "eval_samples_per_second": 440.215,
184
- "eval_steps_per_second": 55.075,
185
  "step": 4250
186
  },
187
  {
@@ -189,9 +189,9 @@
189
  "step": 4250,
190
  "total_flos": 1.2649810588547778e+16,
191
  "train_loss": 0.10639642311544979,
192
- "train_runtime": 1205.6346,
193
- "train_samples_per_second": 225.848,
194
- "train_steps_per_second": 3.525
195
  }
196
  ],
197
  "logging_steps": 500,
 
1
  {
2
+ "best_metric": 0.17333222008850296,
3
  "best_model_checkpoint": "/content/dissertation/scripts/ner/output/checkpoint-2127",
4
  "epoch": 9.988249118683902,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9988249118683902,
13
+ "eval_accuracy": 0.7849561289082346,
14
+ "eval_f1": 0.1613083366573594,
15
+ "eval_loss": 0.6610585451126099,
16
+ "eval_precision": 0.08832008386476806,
17
+ "eval_recall": 0.9292279411764706,
18
+ "eval_runtime": 14.7703,
19
+ "eval_samples_per_second": 461.06,
20
+ "eval_steps_per_second": 57.683,
21
  "step": 425
22
  },
23
  {
 
29
  },
30
  {
31
  "epoch": 2.0,
32
+ "eval_accuracy": 0.7551182940392986,
33
+ "eval_f1": 0.14506880733944952,
34
+ "eval_loss": 0.9204075932502747,
35
+ "eval_precision": 0.07866915422885572,
36
+ "eval_recall": 0.9301470588235294,
37
+ "eval_runtime": 14.7453,
38
+ "eval_samples_per_second": 461.844,
39
+ "eval_steps_per_second": 57.781,
40
  "step": 851
41
  },
42
  {
 
48
  },
49
  {
50
  "epoch": 2.99882491186839,
51
+ "eval_accuracy": 0.7645035495077375,
52
+ "eval_f1": 0.15487907225146869,
53
+ "eval_loss": 0.9544711709022522,
54
+ "eval_precision": 0.0844496214327315,
55
+ "eval_recall": 0.9329044117647058,
56
+ "eval_runtime": 14.8107,
57
+ "eval_samples_per_second": 459.803,
58
+ "eval_steps_per_second": 57.526,
59
  "step": 1276
60
  },
61
  {
 
67
  },
68
  {
69
  "epoch": 4.0,
70
+ "eval_accuracy": 0.7692064756203056,
71
+ "eval_f1": 0.1618332674832082,
72
+ "eval_loss": 1.0923608541488647,
73
+ "eval_precision": 0.08852770813521224,
74
+ "eval_recall": 0.9411764705882353,
75
+ "eval_runtime": 14.8211,
76
+ "eval_samples_per_second": 459.48,
77
+ "eval_steps_per_second": 57.486,
78
  "step": 1702
79
  },
80
  {
 
86
  },
87
  {
88
  "epoch": 4.9988249118683905,
89
+ "eval_accuracy": 0.7932840841995413,
90
+ "eval_f1": 0.17333222008850296,
91
+ "eval_loss": 1.0502684116363525,
92
+ "eval_precision": 0.09532555790247038,
93
+ "eval_recall": 0.9540441176470589,
94
+ "eval_runtime": 14.797,
95
+ "eval_samples_per_second": 460.229,
96
+ "eval_steps_per_second": 57.579,
97
  "step": 2127
98
  },
99
  {
 
105
  },
106
  {
107
  "epoch": 6.0,
108
+ "eval_accuracy": 0.7787771018990209,
109
+ "eval_f1": 0.16632958498503356,
110
+ "eval_loss": 1.2641881704330444,
111
+ "eval_precision": 0.0911913421449481,
112
+ "eval_recall": 0.9448529411764706,
113
+ "eval_runtime": 14.5753,
114
+ "eval_samples_per_second": 467.228,
115
+ "eval_steps_per_second": 58.455,
116
  "step": 2553
117
  },
118
  {
119
  "epoch": 6.9988249118683905,
120
+ "eval_accuracy": 0.7828758564817994,
121
+ "eval_f1": 0.16898640903880793,
122
+ "eval_loss": 1.3261910676956177,
123
+ "eval_precision": 0.09275570735214812,
124
+ "eval_recall": 0.9485294117647058,
125
+ "eval_runtime": 14.5617,
126
+ "eval_samples_per_second": 467.665,
127
+ "eval_steps_per_second": 58.51,
128
  "step": 2978
129
  },
130
  {
 
136
  },
137
  {
138
  "epoch": 8.0,
139
+ "eval_accuracy": 0.7848943386381424,
140
+ "eval_f1": 0.1687846203975236,
141
+ "eval_loss": 1.3697636127471924,
142
+ "eval_precision": 0.09259921344297461,
143
+ "eval_recall": 0.9522058823529411,
144
+ "eval_runtime": 14.6608,
145
+ "eval_samples_per_second": 464.504,
146
+ "eval_steps_per_second": 58.114,
147
  "step": 3404
148
  },
149
  {
 
155
  },
156
  {
157
  "epoch": 8.99882491186839,
158
+ "eval_accuracy": 0.782223625853049,
159
+ "eval_f1": 0.165499476776946,
160
+ "eval_loss": 1.4433350563049316,
161
+ "eval_precision": 0.09069254521393913,
162
+ "eval_recall": 0.9448529411764706,
163
+ "eval_runtime": 15.0504,
164
+ "eval_samples_per_second": 452.478,
165
+ "eval_steps_per_second": 56.61,
166
  "step": 3829
167
  },
168
  {
 
174
  },
175
  {
176
  "epoch": 9.988249118683902,
177
+ "eval_accuracy": 0.7820794485561674,
178
+ "eval_f1": 0.16674769081186194,
179
+ "eval_loss": 1.4861844778060913,
180
+ "eval_precision": 0.0914341567442687,
181
+ "eval_recall": 0.9457720588235294,
182
+ "eval_runtime": 15.3988,
183
+ "eval_samples_per_second": 442.243,
184
+ "eval_steps_per_second": 55.329,
185
  "step": 4250
186
  },
187
  {
 
189
  "step": 4250,
190
  "total_flos": 1.2649810588547778e+16,
191
  "train_loss": 0.10639642311544979,
192
+ "train_runtime": 1208.2019,
193
+ "train_samples_per_second": 225.368,
194
+ "train_steps_per_second": 3.518
195
  }
196
  ],
197
  "logging_steps": 500,