Training complete

Changed files:
- README.md +5 -22
- merges.txt +0 -0
- model.safetensors +1 -1
- special_tokens_map.json +7 -1
- tokenizer.json +0 -0
- tokenizer_config.json +11 -8
- training_args.bin +1 -1
- vocab.json +0 -0
README.md
CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->

 This model is a fine-tuned version of [vinai/phobert-base](https://huggingface.co/vinai/phobert-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss:
+- Loss: 1.5672

 ## Model description

@@ -40,32 +40,15 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs:
+- num_epochs: 3

 ### Training results

 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| No log | 1.0 | 347 | 1.
-| 1.
-|
-| 0.8986 | 4.0 | 1388 | 1.1254 |
-| 0.6019 | 5.0 | 1735 | 1.4252 |
-| 0.3972 | 6.0 | 2082 | 1.5207 |
-| 0.3972 | 7.0 | 2429 | 1.6013 |
-| 0.2536 | 8.0 | 2776 | 1.8216 |
-| 0.1597 | 9.0 | 3123 | 2.0175 |
-| 0.1597 | 10.0 | 3470 | 2.0884 |
-| 0.1262 | 11.0 | 3817 | 2.3397 |
-| 0.0789 | 12.0 | 4164 | 2.4385 |
-| 0.0545 | 13.0 | 4511 | 2.5664 |
-| 0.0545 | 14.0 | 4858 | 2.6797 |
-| 0.0312 | 15.0 | 5205 | 2.7723 |
-| 0.032 | 16.0 | 5552 | 2.8236 |
-| 0.032 | 17.0 | 5899 | 2.7557 |
-| 0.0237 | 18.0 | 6246 | 2.8256 |
-| 0.0157 | 19.0 | 6593 | 2.8168 |
-| 0.0157 | 20.0 | 6940 | 2.8602 |
+| No log | 1.0 | 347 | 1.6831 |
+| 1.73 | 2.0 | 694 | 1.5771 |
+| 1.579 | 3.0 | 1041 | 1.5432 |


 ### Framework versions
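A minimal sketch of loading a checkpoint like the one updated above with 🤗 Transformers. The repo id below is a placeholder, and because the card does not name the task, `AutoModel` returns only the base encoder:

```python
# Minimal loading sketch. "your-username/phobert-finetuned" is a placeholder
# repo id, not the actual repository. PhoBERT expects word-segmented input
# (multi-syllable words joined with underscores).
from transformers import AutoModel, AutoTokenizer

repo_id = "your-username/phobert-finetuned"  # placeholder
tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModel.from_pretrained(repo_id)

inputs = tokenizer("Hà_Nội là thủ_đô của Việt_Nam .", return_tensors="pt")
outputs = model(**inputs)
print(outputs.last_hidden_state.shape)  # (batch_size, sequence_length, hidden_size)
```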
merges.txt
ADDED
(The diff for this file is too large to render.)
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:f5c73d8ae78b018520f1b3486cca36391c1da668efd922b29c10cf3609728520
 size 540038764
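The weights file is tracked with Git LFS, so the diff above only changes the pointer's content hash and size. A quick sketch, assuming the real model.safetensors has already been downloaded locally, of checking it against the new pointer:

```python
# Sketch: verify a downloaded weights file against the Git LFS pointer above.
# The local path is a placeholder; the file is hashed in 1 MiB chunks.
import hashlib

expected_oid = "f5c73d8ae78b018520f1b3486cca36391c1da668efd922b29c10cf3609728520"
expected_size = 540038764

path = "model.safetensors"  # placeholder local path
digest = hashlib.sha256()
size = 0
with open(path, "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        digest.update(chunk)
        size += len(chunk)

print("sha256 matches:", digest.hexdigest() == expected_oid)
print("size matches:", size == expected_size)
```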
special_tokens_map.json
CHANGED
@@ -2,7 +2,13 @@
   "bos_token": "<s>",
   "cls_token": "<s>",
   "eos_token": "</s>",
-  "mask_token":
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
   "pad_token": "<pad>",
   "sep_token": "</s>",
   "unk_token": "<unk>"
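The `mask_token` entry is expanded from a plain value into the serialized form of an added token. A small illustrative sketch of the equivalent object in the `tokenizers` library (the commit itself only changes the JSON):

```python
# Illustrative only: the JSON above is the serialized form of an AddedToken.
# lstrip=True lets "<mask>" absorb the space before it, as in RoBERTa-style tokenizers.
from tokenizers import AddedToken

mask_token = AddedToken(
    "<mask>",
    lstrip=True,
    rstrip=False,
    normalized=False,
    single_word=False,
)
print(mask_token)
```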
tokenizer.json
ADDED
(The diff for this file is too large to render.)
tokenizer_config.json
CHANGED
@@ -1,9 +1,10 @@
 {
+  "add_prefix_space": false,
   "added_tokens_decoder": {
     "0": {
       "content": "<s>",
       "lstrip": false,
-      "normalized":
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -11,7 +12,7 @@
     "1": {
       "content": "<pad>",
       "lstrip": false,
-      "normalized":
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -19,7 +20,7 @@
     "2": {
       "content": "</s>",
       "lstrip": false,
-      "normalized":
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -27,14 +28,14 @@
     "3": {
       "content": "<unk>",
       "lstrip": false,
-      "normalized":
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "
+    "50264": {
       "content": "<mask>",
-      "lstrip":
+      "lstrip": true,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
@@ -45,10 +46,12 @@
   "clean_up_tokenization_spaces": true,
   "cls_token": "<s>",
   "eos_token": "</s>",
+  "errors": "replace",
   "mask_token": "<mask>",
-  "model_max_length":
+  "model_max_length": 512,
   "pad_token": "<pad>",
   "sep_token": "</s>",
-  "tokenizer_class": "
+  "tokenizer_class": "RobertaTokenizer",
+  "trim_offsets": true,
   "unk_token": "<unk>"
 }
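After this change the config declares a RoBERTa-style tokenizer class with a 512-token limit. A short sketch (placeholder repo id) of inspecting those fields once the tokenizer is loaded:

```python
# Sketch of inspecting the updated tokenizer settings; the repo id is a placeholder.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("your-username/phobert-finetuned")
print(type(tokenizer).__name__)    # tokenizer class per tokenizer_config.json
print(tokenizer.model_max_length)  # 512 per tokenizer_config.json
print(tokenizer.mask_token)        # "<mask>"
```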
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:537fabe3c89dfe34e9ac617891ebd37ab6965e8a1462b1be57f16c8dab26607f
 size 4536
vocab.json
ADDED
(The diff for this file is too large to render.)