kearney
/

office-character

@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.3380
-- Accuracy: 0.3293
 ## Model description
@@ -37,51 +37,28 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 3.3e-06
-- train_batch_size: 4
-- eval_batch_size: 4
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 3.0
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
-| 2.2896        | 0.09  | 200  | 2.3458          | 0.328    |
-| 2.3881        | 0.18  | 400  | 2.3456          | 0.3207   |
-| 2.3149        | 0.27  | 600  | 2.3552          | 0.3283   |
-| 2.2579        | 0.36  | 800  | 2.3468          | 0.327    |
-| 2.3016        | 0.45  | 1000 | 2.3512          | 0.327    |
-| 2.3923        | 0.54  | 1200 | 2.3410          | 0.3313   |
-| 2.3458        | 0.63  | 1400 | 2.3416          | 0.328    |
-| 2.3522        | 0.72  | 1600 | 2.3303          | 0.3287   |
-| 2.2485        | 0.81  | 1800 | 2.3291          | 0.3343   |
-| 2.3083        | 0.9   | 2000 | 2.3289          | 0.3327   |
-| 2.2594        | 0.99  | 2200 | 2.3336          | 0.3387   |
-| 2.229         | 1.08  | 2400 | 2.3446          | 0.3213   |
-| 2.3017        | 1.17  | 2600 | 2.3362          | 0.3327   |
-| 2.2405        | 1.26  | 2800 | 2.3299          | 0.335    |
-| 2.3291        | 1.35  | 3000 | 2.3291          | 0.33     |
-| 2.2518        | 1.43  | 3200 | 2.3363          | 0.3297   |
-| 2.268         | 1.52  | 3400 | 2.3623          | 0.3187   |
-| 2.3198        | 1.61  | 3600 | 2.3480          | 0.3277   |
-| 2.1873        | 1.7   | 3800 | 2.3355          | 0.3293   |
-| 2.2634        | 1.79  | 4000 | 2.3291          | 0.326    |
-| 2.1011        | 1.88  | 4200 | 2.3345          | 0.333    |
-| 2.1965        | 1.97  | 4400 | 2.3383          | 0.3293   |
-| 2.2368        | 2.06  | 4600 | 2.3320          | 0.329    |
-| 2.2226        | 2.15  | 4800 | 2.3453          | 0.3263   |
-| 2.2354        | 2.24  | 5000 | 2.3372          | 0.33     |
-| 2.2829        | 2.33  | 5200 | 2.3547          | 0.3223   |
-| 2.1544        | 2.42  | 5400 | 2.3336          | 0.3287   |
-| 2.2777        | 2.51  | 5600 | 2.3425          | 0.3283   |
-| 2.0763        | 2.6   | 5800 | 2.3339          | 0.3307   |
-| 2.2738        | 2.69  | 6000 | 2.3389          | 0.3293   |
-| 2.1013        | 2.78  | 6200 | 2.3411          | 0.327    |
-| 2.1058        | 2.87  | 6400 | 2.3357          | 0.332    |
-| 2.1621        | 2.96  | 6600 | 2.3380          | 0.3293   |
 ### Framework versions

 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.5779
+- Accuracy: 0.2597
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 3.3e-05
+- train_batch_size: 20
+- eval_batch_size: 10
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 1.0
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
+| No log        | 0.09  | 200  | 2.6170          | 0.2412   |
+| No log        | 0.19  | 400  | 2.6193          | 0.2412   |
+| No log        | 0.28  | 600  | 2.6109          | 0.2519   |
+| No log        | 0.37  | 800  | 2.5937          | 0.2551   |
+| No log        | 0.47  | 1000 | 2.5840          | 0.2607   |
+| No log        | 0.56  | 1200 | 2.5814          | 0.2620   |
+| No log        | 0.66  | 1400 | 2.5889          | 0.2535   |
+| No log        | 0.75  | 1600 | 2.5779          | 0.2595   |
+| No log        | 0.84  | 1800 | 2.5752          | 0.2622   |
+| 2.4849        | 0.94  | 2000 | 2.5779          | 0.2597   |
 ### Framework versions

config.json CHANGED Viewed

@@ -9,91 +9,71 @@
   "dropout": 0.1,
   "hidden_dim": 3072,
   "id2label": {
-    "0": "Abby",
-    "1": "Andy",
-    "2": "Angela",
-    "3": "Billy Merchant",
-    "4": "Captain Jack",
-    "5": "Carol",
-    "6": "Christian",
-    "7": "Craig",
-    "8": "Creed",
-    "9": "Darryl",
-    "10": "David",
-    "11": "Dwight",
-    "12": "Hannah",
-    "13": "Improv Teacher",
-    "14": "Jake",
-    "15": "Jan",
-    "16": "Jim",
-    "17": "Josh",
-    "18": "Karen",
-    "19": "Katy",
-    "20": "Kelly",
-    "21": "Kevin",
-    "22": "Martin",
-    "23": "Mary-Beth",
-    "24": "Melissa",
-    "25": "Meredith",
-    "26": "Michael",
-    "27": "Mr. Brown",
-    "28": "Oscar",
-    "29": "Pam",
-    "30": "Pam's Mom",
-    "31": "Photographer",
-    "32": "Phyllis",
-    "33": "Roy",
-    "34": "Ryan",
-    "35": "Sadiq (IT guy)",
-    "36": "Second Cindy",
-    "37": "Stanley",
-    "38": "Toby",
-    "39": "Todd Packer",
-    "40": "Tony"
   },
   "initializer_range": 0.02,
   "label2id": {
-    "Abby": 0,
-    "Andy": 1,
-    "Angela": 2,
-    "Billy Merchant": 3,
-    "Captain Jack": 4,
-    "Carol": 5,
-    "Christian": 6,
-    "Craig": 7,
-    "Creed": 8,
-    "Darryl": 9,
-    "David": 10,
-    "Dwight": 11,
-    "Hannah": 12,
-    "Improv Teacher": 13,
-    "Jake": 14,
-    "Jan": 15,
-    "Jim": 16,
-    "Josh": 17,
-    "Karen": 18,
-    "Katy": 19,
-    "Kelly": 20,
-    "Kevin": 21,
-    "Martin": 22,
-    "Mary-Beth": 23,
-    "Melissa": 24,
-    "Meredith": 25,
-    "Michael": 26,
-    "Mr. Brown": 27,
-    "Oscar": 28,
-    "Pam": 29,
-    "Pam's Mom": 30,
-    "Photographer": 31,
-    "Phyllis": 32,
-    "Roy": 33,
-    "Ryan": 34,
-    "Sadiq (IT guy)": 35,
-    "Second Cindy": 36,
-    "Stanley": 37,
-    "Toby": 38,
-    "Todd Packer": 39,
-    "Tony": 40
   },
   "max_position_embeddings": 512,
   "model_type": "distilbert",

   "dropout": 0.1,
   "hidden_dim": 3072,
   "id2label": {
+    "0": "Andy",
+    "1": "Angela",
+    "2": "Charles",
+    "3": "Clark",
+    "4": "Creed",
+    "5": "Darryl",
+    "6": "David",
+    "7": "David Wallace",
+    "8": "Deangelo",
+    "9": "Dwight",
+    "10": "Erin",
+    "11": "Gabe",
+    "12": "Holly",
+    "13": "Jan",
+    "14": "Jim",
+    "15": "Jo",
+    "16": "Karen",
+    "17": "Kelly",
+    "18": "Kevin",
+    "19": "Meredith",
+    "20": "Michael",
+    "21": "Nellie",
+    "22": "Oscar",
+    "23": "Pam",
+    "24": "Pete",
+    "25": "Phyllis",
+    "26": "Robert",
+    "27": "Roy",
+    "28": "Ryan",
+    "29": "Stanley",
+    "30": "Toby"
   },
   "initializer_range": 0.02,
   "label2id": {
+    "Andy": 0,
+    "Angela": 1,
+    "Charles": 2,
+    "Clark": 3,
+    "Creed": 4,
+    "Darryl": 5,
+    "David": 6,
+    "David Wallace": 7,
+    "Deangelo": 8,
+    "Dwight": 9,
+    "Erin": 10,
+    "Gabe": 11,
+    "Holly": 12,
+    "Jan": 13,
+    "Jim": 14,
+    "Jo": 15,
+    "Karen": 16,
+    "Kelly": 17,
+    "Kevin": 18,
+    "Meredith": 19,
+    "Michael": 20,
+    "Nellie": 21,
+    "Oscar": 22,
+    "Pam": 23,
+    "Pete": 24,
+    "Phyllis": 25,
+    "Robert": 26,
+    "Roy": 27,
+    "Ryan": 28,
+    "Stanley": 29,
+    "Toby": 30
   },
   "max_position_embeddings": 512,
   "model_type": "distilbert",

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:72b97b1c1cc234dc3e7806a83c7d8514b3e38703205a8945e6df8364bef8ac96
-size 267974061

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1fad4844e4cbb392ef4d15409f2d3caaf911c6cfc9cae9693780f4d0177eea9
+size 267943341

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca52886750a1b05ad2f299bbcecea11da584901c2158abc7f50677a847705e2b
 size 4027

 version https://git-lfs.github.com/spec/v1
+oid sha256:1cc712bb79d6cd37b9b82ff868848d83639f4677e1d1eef5be7989eeafb38c23
 size 4027