mwoelki committed on
Commit
120ab0a
1 Parent(s): 40dd8ee

End of training

Browse files
README.md CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 1.1487
19
 
20
  ## Model description
21
 
@@ -46,9 +46,9 @@ The following hyperparameters were used during training:
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
- | No log | 1.0 | 495 | 1.2865 |
50
- | 1.6273 | 2.0 | 990 | 1.1770 |
51
- | 1.3219 | 3.0 | 1485 | 1.1487 |
52
 
53
 
54
  ### Framework versions
 
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 3.2714
19
 
20
  ## Model description
21
 
 
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
+ | No log | 1.0 | 3 | 3.5388 |
50
+ | No log | 2.0 | 6 | 3.3409 |
51
+ | No log | 3.0 | 9 | 3.2714 |
52
 
53
 
54
  ### Framework versions
config.json CHANGED
@@ -6,10 +6,12 @@
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
 
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
 
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
 
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
9
+ "do_sample": true,
10
  "embd_pdrop": 0.1,
11
  "eos_token_id": 50256,
12
  "initializer_range": 0.02,
13
  "layer_norm_epsilon": 1e-05,
14
+ "max_length": 50,
15
  "model_type": "gpt2",
16
  "n_ctx": 1024,
17
  "n_embd": 768,
generation_config.json CHANGED
@@ -1,6 +1,9 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
 
4
  "eos_token_id": 50256,
 
 
5
  "transformers_version": "4.41.2"
6
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
4
+ "do_sample": true,
5
  "eos_token_id": 50256,
6
+ "max_length": 50,
7
+ "pad_token_id": 50256,
8
  "transformers_version": "4.41.2"
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2116a6390a20e1d15f39736be47286f60308ac8c0a21fadf8484bced1542c2f
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49c4672d24e79732c642c6803783920d9b18e29aa70b71ced578c5be7f4b0f66
3
  size 497774208
runs/Jun15_11-37-46_8423c480c5d4/events.out.tfevents.1718451467.8423c480c5d4.3030.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a8feba4ecd2b4058f611c4c9a7321f1067c18de90a9e868d8d88fb5e79feb2
3
+ size 5116
runs/Jun15_11-38-20_8423c480c5d4/events.out.tfevents.1718451501.8423c480c5d4.3030.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98eb91ac308465de21d3eec43032b70f6c2084379d57116dfbbb678f3c0d3ce7
3
+ size 5116
runs/Jun15_11-41-21_8423c480c5d4/events.out.tfevents.1718451681.8423c480c5d4.3030.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c65768e041b731fe4f65604fe5dedae86b5aec4a83055ce62f20f7942e0fa1e
3
+ size 5116
runs/Jun15_11-45-10_8423c480c5d4/events.out.tfevents.1718451910.8423c480c5d4.3030.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36e3a3003f1796531ba8fd2cb5f545a13bc98bbef284726eaf4b997d16bb78f6
3
+ size 5116
runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452299.8423c480c5d4.3030.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c8c0f5b486e5db013375e94f8c9398e517c3e03b05a3edaa22e0edd173f877d
3
+ size 6262
runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452320.8423c480c5d4.3030.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436ac86bd38772dffb592815916175ab7abe4b72230a1c3886a9fed7edef1386
3
+ size 354
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7756109a9c95e98e3b9452ad49f0dbebfe093dcbc4d51a3f21f715bd510a374a
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:766b3c4cd493c10475b8fddb906959a4abee22819d32a7ec7188882a59e595f2
3
  size 5176