stulcrad
/

CNEC1_1_extended_xlm-roberta-large

@@ -25,16 +25,16 @@ model-index:
     metrics:
     - name: Precision
       type: precision
-      value: 0.843939393939394
     - name: Recall
       type: recall
-      value: 0.8767051416579223
     - name: F1
       type: f1
-      value: 0.8600102933607823
     - name: Accuracy
       type: accuracy
-      value: 0.9590540063536886
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -44,11 +44,11 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [FacebookAI/xlm-roberta-large](https://huggingface.co/FacebookAI/xlm-roberta-large) on the cnec dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.2330
-- Precision: 0.8439
-- Recall: 0.8767
-- F1: 0.8600
-- Accuracy: 0.9591
 ## Model description
@@ -68,24 +68,30 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 32
-- eval_batch_size: 32
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 25
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
-| 0.6037        | 3.42  | 500  | 0.2144          | 0.6741    | 0.7263 | 0.6993 | 0.9407   |
-| 0.2517        | 6.85  | 1000 | 0.1774          | 0.7915    | 0.8381 | 0.8141 | 0.9575   |
-| 0.1854        | 10.27 | 1500 | 0.1633          | 0.8251    | 0.8621 | 0.8432 | 0.9632   |
-| 0.1476        | 13.7  | 2000 | 0.1610          | 0.8356    | 0.8803 | 0.8574 | 0.9664   |
-| 0.1248        | 17.12 | 2500 | 0.1657          | 0.8459    | 0.8830 | 0.8640 | 0.9682   |
-| 0.1086        | 20.55 | 3000 | 0.1671          | 0.8542    | 0.8862 | 0.8699 | 0.9683   |
-| 0.0985        | 23.97 | 3500 | 0.1610          | 0.8600    | 0.8931 | 0.8762 | 0.9700   |
 ### Framework versions

     metrics:
     - name: Precision
       type: precision
+      value: 0.8567735263702172
     - name: Recall
       type: recall
+      value: 0.8856226616782469
     - name: F1
       type: f1
+      value: 0.8709592641261498
     - name: Accuracy
       type: accuracy
+      value: 0.9657602026679334
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [FacebookAI/xlm-roberta-large](https://huggingface.co/FacebookAI/xlm-roberta-large) on the cnec dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2099
+- Precision: 0.8568
+- Recall: 0.8856
+- F1: 0.8710
+- Accuracy: 0.9658
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 8
+- eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 12
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
+| 0.4598        | 0.86  | 500  | 0.1804          | 0.7750    | 0.8156 | 0.7948 | 0.9556   |
+| 0.2213        | 1.72  | 1000 | 0.1511          | 0.8054    | 0.8338 | 0.8193 | 0.9623   |
+| 0.1614        | 2.58  | 1500 | 0.1517          | 0.8252    | 0.8632 | 0.8438 | 0.9633   |
+| 0.1436        | 3.44  | 2000 | 0.1692          | 0.8207    | 0.8541 | 0.8371 | 0.9619   |
+| 0.1199        | 4.3   | 2500 | 0.1638          | 0.8309    | 0.8589 | 0.8447 | 0.9626   |
+| 0.1076        | 5.16  | 3000 | 0.1710          | 0.8423    | 0.8819 | 0.8616 | 0.9659   |
+| 0.0907        | 6.02  | 3500 | 0.1640          | 0.8366    | 0.8594 | 0.8479 | 0.9651   |
+| 0.0729        | 6.88  | 4000 | 0.1657          | 0.8411    | 0.8658 | 0.8533 | 0.9651   |
+| 0.0678        | 7.75  | 4500 | 0.1919          | 0.8444    | 0.8728 | 0.8583 | 0.9641   |
+| 0.0577        | 8.61  | 5000 | 0.1877          | 0.8429    | 0.8744 | 0.8583 | 0.9644   |
+| 0.0495        | 9.47  | 5500 | 0.1921          | 0.8512    | 0.8803 | 0.8655 | 0.9652   |
+| 0.0462        | 10.33 | 6000 | 0.1952          | 0.8509    | 0.8787 | 0.8646 | 0.9658   |
+| 0.0383        | 11.19 | 6500 | 0.2099          | 0.8568    | 0.8856 | 0.8710 | 0.9658   |
 ### Framework versions

config.json CHANGED Viewed

@@ -3,12 +3,12 @@
   "architectures": [
     "XLMRobertaForTokenClassification"
   ],
-  "attention_probs_dropout_prob": 0.2,
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.4,
   "hidden_size": 1024,
   "id2label": {
     "0": "O",

   "architectures": [
     "XLMRobertaForTokenClassification"
   ],
+  "attention_probs_dropout_prob": 0.25,
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.25,
   "hidden_size": 1024,
   "id2label": {
     "0": "O",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:59bd35b85e3c1ea53167b581e47c0071bf767d9c2a95d08524089d7cc6eb654b
 size 2235473356

 version https://git-lfs.github.com/spec/v1
+oid sha256:b11bd00e1954f7ed11c669792e2d81b588166a305d4b4712ba29b12944d69658
 size 2235473356

tokenizer_config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "added_tokens_decoder": {
     "0": {
       "content": "<s>",

 {
+  "add_prefix_space": true,
   "added_tokens_decoder": {
     "0": {
       "content": "<s>",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d950f5cbacd47c735cf795a7bb9260f9ed5e8763601f8428d23f4d02bd12652
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:f673b0ea2252981f0f4d60f8b28f7976a7e2c8590676c86ae69d8fec6a5ac560
 size 4728