mwoelki committed on
Commit
270ab1b
1 Parent(s): d0ad332

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,30 +1,21 @@
1
  {
2
- "_name_or_path": "distilbert/distilgpt2",
3
- "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
6
  "GPT2LMHeadModel"
7
  ],
8
  "attn_pdrop": 0.1,
9
  "bos_token_id": 50256,
10
- "do_sample": true,
11
  "embd_pdrop": 0.1,
12
  "eos_token_id": 50256,
13
- "id2label": {
14
- "0": "LABEL_0"
15
- },
16
  "initializer_range": 0.02,
17
- "label2id": {
18
- "LABEL_0": 0
19
- },
20
  "layer_norm_epsilon": 1e-05,
21
- "max_length": 50,
22
  "model_type": "gpt2",
23
  "n_ctx": 1024,
24
  "n_embd": 768,
25
  "n_head": 12,
26
  "n_inner": null,
27
- "n_layer": 6,
28
  "n_positions": 1024,
29
  "reorder_and_upcast_attn": false,
30
  "resid_pdrop": 0.1,
 
1
  {
2
+ "_name_or_path": "gpt2",
 
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
 
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
 
 
 
11
  "initializer_range": 0.02,
 
 
 
12
  "layer_norm_epsilon": 1e-05,
 
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
16
  "n_head": 12,
17
  "n_inner": null,
18
+ "n_layer": 12,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9d223556906b98f28cdd2295c15255c62d86fb94b8b949588c135f116f31555
3
- size 327657928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49575472d18824b10eddb72c1abeb23409f275e144bcec177bcc26209d569bc
3
+ size 497774208
runs/Jun15_08-40-22_3981491d00a1/events.out.tfevents.1718440823.3981491d00a1.941.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16f4f92b8f146bb2efef8d1854103bf7ac854d330875393ce655cc8fedf38b86
3
- size 6263
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed7ea4757eb9194caa4e063ac9335557b68268a76adca9127764b23f58b657da
3
+ size 6888
runs/Jun15_08-40-22_3981491d00a1/events.out.tfevents.1718441203.3981491d00a1.941.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d8874de3f678b1ab75a08ecfd6f24d5d557be54a82d0136b00b2a21dc4b1994
3
+ size 359
runs/Jun15_09-20-48_3981491d00a1/events.out.tfevents.1718443249.3981491d00a1.941.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9550f63b55e4202e1965fb56b504b83c1e65456cefac363ea3e63045d741fce
3
+ size 5598
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb20a334e63fcedd4e934ce03976286990a9087a15b98001cf943e72a8df26f5
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51e9e940e2056f53df545b821f8946ce63f4ded8bafc5a28b604f2c3fa46333e
3
  size 5176