End of training
Browse files
- README.md +4 -4
- config.json +2 -0
- generation_config.json +3 -0
- model.safetensors +1 -1
- runs/Jun15_11-37-46_8423c480c5d4/events.out.tfevents.1718451467.8423c480c5d4.3030.2 +3 -0
- runs/Jun15_11-38-20_8423c480c5d4/events.out.tfevents.1718451501.8423c480c5d4.3030.3 +3 -0
- runs/Jun15_11-41-21_8423c480c5d4/events.out.tfevents.1718451681.8423c480c5d4.3030.4 +3 -0
- runs/Jun15_11-45-10_8423c480c5d4/events.out.tfevents.1718451910.8423c480c5d4.3030.5 +3 -0
- runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452299.8423c480c5d4.3030.6 +3 -0
- runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452320.8423c480c5d4.3030.7 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
15 |
|
16 |
This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on the None dataset.
|
17 |
It achieves the following results on the evaluation set:
|
18 |
-
- Loss:
|
19 |
|
20 |
## Model description
|
21 |
|
@@ -46,9 +46,9 @@ The following hyperparameters were used during training:
|
|
46 |
|
47 |
| Training Loss | Epoch | Step | Validation Loss |
|
48 |
|:-------------:|:-----:|:----:|:---------------:|
|
49 |
-
| No log | 1.0 |
|
50 |
-
|
|
51 |
-
|
|
52 |
|
53 |
|
54 |
### Framework versions
|
|
|
15 |
|
16 |
This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on the None dataset.
|
17 |
It achieves the following results on the evaluation set:
|
18 |
+
- Loss: 3.2714
|
19 |
|
20 |
## Model description
|
21 |
|
|
|
46 |
|
47 |
| Training Loss | Epoch | Step | Validation Loss |
|
48 |
|:-------------:|:-----:|:----:|:---------------:|
|
49 |
+
| No log | 1.0 | 3 | 3.5388 |
|
50 |
+
| No log | 2.0 | 6 | 3.3409 |
|
51 |
+
| No log | 3.0 | 9 | 3.2714 |
|
52 |
|
53 |
|
54 |
### Framework versions
|
config.json
CHANGED
@@ -6,10 +6,12 @@
|
|
6 |
],
|
7 |
"attn_pdrop": 0.1,
|
8 |
"bos_token_id": 50256,
|
|
|
9 |
"embd_pdrop": 0.1,
|
10 |
"eos_token_id": 50256,
|
11 |
"initializer_range": 0.02,
|
12 |
"layer_norm_epsilon": 1e-05,
|
|
|
13 |
"model_type": "gpt2",
|
14 |
"n_ctx": 1024,
|
15 |
"n_embd": 768,
|
|
|
6 |
],
|
7 |
"attn_pdrop": 0.1,
|
8 |
"bos_token_id": 50256,
|
9 |
+
"do_sample": true,
|
10 |
"embd_pdrop": 0.1,
|
11 |
"eos_token_id": 50256,
|
12 |
"initializer_range": 0.02,
|
13 |
"layer_norm_epsilon": 1e-05,
|
14 |
+
"max_length": 50,
|
15 |
"model_type": "gpt2",
|
16 |
"n_ctx": 1024,
|
17 |
"n_embd": 768,
|
generation_config.json
CHANGED
@@ -1,6 +1,9 @@
|
|
1 |
{
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 50256,
|
|
|
4 |
"eos_token_id": 50256,
|
|
|
|
|
5 |
"transformers_version": "4.41.2"
|
6 |
}
|
|
|
1 |
{
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 50256,
|
4 |
+
"do_sample": true,
|
5 |
"eos_token_id": 50256,
|
6 |
+
"max_length": 50,
|
7 |
+
"pad_token_id": 50256,
|
8 |
"transformers_version": "4.41.2"
|
9 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 497774208
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49c4672d24e79732c642c6803783920d9b18e29aa70b71ced578c5be7f4b0f66
|
3 |
size 497774208
|
runs/Jun15_11-37-46_8423c480c5d4/events.out.tfevents.1718451467.8423c480c5d4.3030.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63a8feba4ecd2b4058f611c4c9a7321f1067c18de90a9e868d8d88fb5e79feb2
|
3 |
+
size 5116
|
runs/Jun15_11-38-20_8423c480c5d4/events.out.tfevents.1718451501.8423c480c5d4.3030.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98eb91ac308465de21d3eec43032b70f6c2084379d57116dfbbb678f3c0d3ce7
|
3 |
+
size 5116
|
runs/Jun15_11-41-21_8423c480c5d4/events.out.tfevents.1718451681.8423c480c5d4.3030.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c65768e041b731fe4f65604fe5dedae86b5aec4a83055ce62f20f7942e0fa1e
|
3 |
+
size 5116
|
runs/Jun15_11-45-10_8423c480c5d4/events.out.tfevents.1718451910.8423c480c5d4.3030.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36e3a3003f1796531ba8fd2cb5f545a13bc98bbef284726eaf4b997d16bb78f6
|
3 |
+
size 5116
|
runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452299.8423c480c5d4.3030.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c8c0f5b486e5db013375e94f8c9398e517c3e03b05a3edaa22e0edd173f877d
|
3 |
+
size 6262
|
runs/Jun15_11-51-39_8423c480c5d4/events.out.tfevents.1718452320.8423c480c5d4.3030.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:436ac86bd38772dffb592815916175ab7abe4b72230a1c3886a9fed7edef1386
|
3 |
+
size 354
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:766b3c4cd493c10475b8fddb906959a4abee22819d32a7ec7188882a59e595f2
|
3 |
size 5176
|