add model

Files changed (10) hide show

README.md CHANGED Viewed

@@ -17,9 +17,9 @@ should probably proofread and complete it, then remove this comment. -->
 # distilgpt2-finetuned-distilgpt2-med_articles
-This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 3.5189
 ## Model description
@@ -50,11 +50,11 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| No log        | 1.0   | 260  | 3.6093          |
-| 3.7297        | 2.0   | 520  | 3.5603          |
-| 3.7297        | 3.0   | 780  | 3.5338          |
-| 3.5313        | 4.0   | 1040 | 3.5232          |
-| 3.5313        | 5.0   | 1300 | 3.5189          |
 ### Framework versions

 # distilgpt2-finetuned-distilgpt2-med_articles
+This model is a fine-tuned version of [vishnun/distilgpt2-finetuned-distilgpt2-med_articles](https://huggingface.co/vishnun/distilgpt2-finetuned-distilgpt2-med_articles) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 3.3171
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| No log        | 1.0   | 65   | 3.3417          |
+| No log        | 2.0   | 130  | 3.3300          |
+| No log        | 3.0   | 195  | 3.3231          |
+| No log        | 4.0   | 260  | 3.3172          |
+| No log        | 5.0   | 325  | 3.3171          |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "distilgpt2",
   "_num_labels": 1,
   "activation_function": "gelu_new",
   "architectures": [
@@ -7,6 +7,7 @@
   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "gradient_checkpointing": false,
@@ -18,6 +19,7 @@
     "LABEL_0": 0
   },
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
   "n_embd": 768,

 {
+  "_name_or_path": "vishnun/distilgpt2-finetuned-distilgpt2-med_articles",
   "_num_labels": 1,
   "activation_function": "gelu_new",
   "architectures": [
   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
+  "do_sample": true,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "gradient_checkpointing": false,
     "LABEL_0": 0
   },
   "layer_norm_epsilon": 1e-05,
+  "max_length": 50,
   "model_type": "gpt2",
   "n_ctx": 1024,
   "n_embd": 768,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f47bdd9cc0f58241e8c3723535e1d140733ebdbdacb62fa8bb46ce5635eb176e
 size 333972957

 version https://git-lfs.github.com/spec/v1
+oid sha256:dcf07f157ab32d63a4f5b38f8a35d99942b7238f8fa6942c2f5b6baff7c030f4
 size 333972957

runs/Aug19_10-11-15_a08bd7a25748/1629367894.5506911/events.out.tfevents.1629367894.a08bd7a25748.75.4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c3d90fe2bfc78c5d9160eda570682b316c0af8ea2f9290578936934c46b3c25
+size 4205

runs/Aug19_10-11-15_a08bd7a25748/events.out.tfevents.1629367894.a08bd7a25748.75.3 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d2de0ab23b294092cccf96814687e15e31e2457274557a7565b8554188c26df8
+size 3375

runs/Aug19_10-13-56_a08bd7a25748/1629368049.1363611/events.out.tfevents.1629368049.a08bd7a25748.75.6 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:78d090efcef9e0f0eb6c14bce900722caf36b59ef95dfdaff7e029bfcef70cab
+size 4205

runs/Aug19_10-13-56_a08bd7a25748/events.out.tfevents.1629368049.a08bd7a25748.75.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:34face3efbf357ecd3930c490a42fc88fa98185be0dd05983a54af725d77630a
+size 5079

runs/Aug19_10-13-56_a08bd7a25748/events.out.tfevents.1629368588.a08bd7a25748.75.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:85654bb00d9b16efc98d373a4e26816aa8ca0b03884fa0d33f6067b10faa2043
+size 311

tokenizer_config.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "distilgpt2", "tokenizer_class": "GPT2Tokenizer"}


1	+ {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "vishnun/distilgpt2-finetuned-distilgpt2-med_articles", "tokenizer_class": "GPT2Tokenizer"}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0405174ec65f57997442cf28a7725916e28a12529b30095d35752bd25f6282c5
 size 2671

 version https://git-lfs.github.com/spec/v1
+oid sha256:90b96e6e0eca55c7c95c3a94a4b717f44b22126fbf53b33be361b11b18bf3964
 size 2671