Model save

Browse files

Files changed (8) hide show

README.md +19 -29
config.json +1 -1
eval_results.json +6 -6
logs/events.out.tfevents.1722374450.nathan.153742.0 +3 -0
logs/events.out.tfevents.1722374714.nathan.153742.1 +3 -0
model.safetensors +1 -1
run_config.json +4 -4
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [docketanalyzer/docket-lm-xs](https://huggingface.co/docketanalyzer/docket-lm-xs) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.0048
-- F1: 0.9995
 ## Model description
@@ -45,40 +45,30 @@ The following hyperparameters were used during training:
 - total_train_batch_size: 16
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- lr_scheduler_warmup_steps: 100
 - num_epochs: 1
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | F1     |
-|:-------------:|:------:|:----:|:---------------:|:------:|
-| 0.0017        | 0.0435 | 300  | 0.0115          | 0.9976 |
-| 0.0011        | 0.0870 | 600  | 0.0133          | 0.9978 |
-| 0.0022        | 0.1305 | 900  | 0.0116          | 0.9972 |
-| 0.0002        | 0.1740 | 1200 | 0.0127          | 0.9981 |
-| 0.0005        | 0.2175 | 1500 | 0.0092          | 0.9981 |
-| 0.0002        | 0.2611 | 1800 | 0.0120          | 0.9979 |
-| 0.0002        | 0.3046 | 2100 | 0.0079          | 0.9985 |
-| 0.0001        | 0.3481 | 2400 | 0.0146          | 0.9961 |
-| 0.0003        | 0.3916 | 2700 | 0.0075          | 0.9988 |
-| 0.0003        | 0.4351 | 3000 | 0.0088          | 0.9986 |
-| 0.0001        | 0.4786 | 3300 | 0.0095          | 0.9988 |
-| 0.0001        | 0.5221 | 3600 | 0.0067          | 0.9991 |
-| 0.0001        | 0.5656 | 3900 | 0.0077          | 0.9990 |
-| 0.0001        | 0.6091 | 4200 | 0.0084          | 0.9985 |
-| 0.0001        | 0.6526 | 4500 | 0.0049          | 0.9995 |
-| 0.0347        | 0.6962 | 4800 | 0.0056          | 0.9993 |
-| 0.0001        | 0.7397 | 5100 | 0.0067          | 0.9988 |
-| 0.0016        | 0.7832 | 5400 | 0.0068          | 0.9986 |
-| 0.0001        | 0.8267 | 5700 | 0.0054          | 0.9990 |
-| 0.0001        | 0.8702 | 6000 | 0.0053          | 0.9991 |
-| 0.0872        | 0.9137 | 6300 | 0.0048          | 0.9995 |
-| 0.0001        | 0.9572 | 6600 | 0.0048          | 0.9995 |
 ### Framework versions
-- Transformers 4.41.1
-- Pytorch 2.3.0+cu121
 - Datasets 2.14.4
 - Tokenizers 0.19.1

 This model is a fine-tuned version of [docketanalyzer/docket-lm-xs](https://huggingface.co/docketanalyzer/docket-lm-xs) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.0121
+- F1: 0.9981
 ## Model description
 - total_train_batch_size: 16
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- lr_scheduler_warmup_ratio: 0.02
 - num_epochs: 1
 ### Training results
+| Training Loss | Epoch | Step | Validation Loss | F1     |
+|:-------------:|:-----:|:----:|:---------------:|:------:|
+| 0.0312        | 0.08  | 95   | 0.0374          | 0.9923 |
+| 0.0035        | 0.16  | 190  | 0.0096          | 0.9981 |
+| 0.0022        | 0.24  | 285  | 0.0068          | 0.9990 |
+| 0.0016        | 0.32  | 380  | 0.0143          | 0.9971 |
+| 0.0012        | 0.4   | 475  | 0.0124          | 0.9981 |
+| 0.0013        | 0.48  | 570  | 0.0127          | 0.9981 |
+| 0.0012        | 0.56  | 665  | 0.0114          | 0.9981 |
+| 0.0011        | 0.64  | 760  | 0.0130          | 0.9981 |
+| 0.001         | 0.72  | 855  | 0.0117          | 0.9981 |
+| 0.0005        | 0.8   | 950  | 0.0130          | 0.9981 |
+| 0.0005        | 0.88  | 1045 | 0.0118          | 0.9981 |
+| 0.0005        | 0.96  | 1140 | 0.0126          | 0.9981 |
 ### Framework versions
+- Transformers 4.43.3
+- Pytorch 2.3.1+cu121
 - Datasets 2.14.4
 - Tokenizers 0.19.1

config.json CHANGED Viewed

@@ -37,7 +37,7 @@
   "relative_attention": true,
   "share_att_key": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.41.1",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

   "relative_attention": true,
   "share_att_key": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.43.3",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

eval_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "eval_loss": 0.004779691807925701,
-    "eval_f1": 0.999485155311481,
-    "eval_runtime": 19.4506,
-    "eval_samples_per_second": 298.5,
-    "eval_steps_per_second": 18.663,
-    "epoch": 1.0
 }

 {
+    "eval_loss": 0.012090153060853481,
+    "eval_f1": 0.9980582524271845,
+    "eval_runtime": 3.2065,
+    "eval_samples_per_second": 311.867,
+    "eval_steps_per_second": 19.648,
+    "epoch": 0.999578947368421
 }

logs/events.out.tfevents.1722374450.nathan.153742.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:557aed47c2037a606ad7d9eeb6eb643c62e2e9e706445991bee346af3d72ec89
+size 134323

logs/events.out.tfevents.1722374714.nathan.153742.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0d88cbe0a24e9a047ad614b89b1ea913289224d182b56e20e2361783d9b5529d
+size 405

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e1266d7a450140330afab29beb86e9f6fa0e5bb5218d67a0c223ab027937ac8b
 size 283347432

 version https://git-lfs.github.com/spec/v1
+oid sha256:e16ee7f54b2c1219c0e6a0bfc4330695714db5ebef98be08a0e2742c481eb8fe
 size 283347432

run_config.json CHANGED Viewed

@@ -10,12 +10,12 @@
         "gradient_accumulation_steps": 2,
         "learning_rate": 5e-05,
         "weight_decay": 0.1,
-        "warmup_steps": 100,
         "evaluation_strategy": "steps",
-        "eval_steps": 300,
-        "save_steps": 300,
         "save_total_limit": 2
     },
-    "run_name": "initial_model",
     "run_type": "ClassificationRoutine"
 }

         "gradient_accumulation_steps": 2,
         "learning_rate": 5e-05,
         "weight_decay": 0.1,
+        "warmup_ratio": 0.02,
         "evaluation_strategy": "steps",
+        "eval_steps": 0.08,
+        "save_steps": 0.08,
         "save_total_limit": 2
     },
+    "run_name": "complaint",
     "run_type": "ClassificationRoutine"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3656fcbc1832dd9c0867ba00d4106f7f2d6ac5ab8dfe75730fee3152c51822ce
-size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:66ef2207833c0afa403c72448d2b06f189c7278d0be4661827287b01ffc17100
+size 5240