Training in progress, step 500
Browse files- adapter_config.json +28 -0
- adapter_model.safetensors +3 -0
- merges.txt +0 -0
- runs/May08_11-45-43_180d96a9f229/events.out.tfevents.1715168759.180d96a9f229.6794.0 +3 -0
- runs/May08_12-20-56_180d96a9f229/events.out.tfevents.1715170862.180d96a9f229.19937.0 +3 -0
- runs/May08_12-52-04_180d96a9f229/events.out.tfevents.1715172727.180d96a9f229.30545.0 +3 -0
- runs/May08_12-53-28_180d96a9f229/events.out.tfevents.1715172811.180d96a9f229.30545.1 +3 -0
- runs/May12_06-33-01_4b23207d8454/events.out.tfevents.1715495589.4b23207d8454.3581.0 +3 -0
- runs/May12_06-51-56_4b23207d8454/events.out.tfevents.1715496719.4b23207d8454.9272.0 +3 -0
- runs/May12_06-53-10_4b23207d8454/events.out.tfevents.1715496797.4b23207d8454.9272.1 +3 -0
- runs/May12_08-10-20_4b23207d8454/events.out.tfevents.1715501422.4b23207d8454.9272.2 +3 -0
- runs/May12_08-13-29_4b23207d8454/events.out.tfevents.1715501618.4b23207d8454.9272.3 +3 -0
- runs/May12_08-17-01_4b23207d8454/events.out.tfevents.1715501851.4b23207d8454.9272.4 +3 -0
- runs/May14_13-58-28_8639c74b4083/events.out.tfevents.1715695111.8639c74b4083.230.0 +3 -0
- runs/May14_14-02-12_8639c74b4083/events.out.tfevents.1715695337.8639c74b4083.230.1 +3 -0
- runs/May14_14-30-34_8639c74b4083/events.out.tfevents.1715697046.8639c74b4083.230.2 +3 -0
- runs/May14_14-31-25_8639c74b4083/events.out.tfevents.1715697097.8639c74b4083.230.3 +3 -0
- runs/May14_14-37-45_8639c74b4083/events.out.tfevents.1715697475.8639c74b4083.230.4 +3 -0
- runs/May14_14-41-32_8639c74b4083/events.out.tfevents.1715697701.8639c74b4083.230.5 +3 -0
- special_tokens_map.json +6 -0
- tokenizer.json +0 -0
- tokenizer_config.json +20 -0
- training_args.bin +3 -0
- vocab.json +0 -0
adapter_config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"alpha_pattern": {},
|
3 |
+
"auto_mapping": null,
|
4 |
+
"base_model_name_or_path": "gpt2",
|
5 |
+
"bias": "none",
|
6 |
+
"fan_in_fan_out": true,
|
7 |
+
"inference_mode": true,
|
8 |
+
"init_lora_weights": true,
|
9 |
+
"layer_replication": null,
|
10 |
+
"layers_pattern": null,
|
11 |
+
"layers_to_transform": null,
|
12 |
+
"loftq_config": {},
|
13 |
+
"lora_alpha": 32,
|
14 |
+
"lora_dropout": 0.01,
|
15 |
+
"megatron_config": null,
|
16 |
+
"megatron_core": "megatron.core",
|
17 |
+
"modules_to_save": null,
|
18 |
+
"peft_type": "LORA",
|
19 |
+
"r": 8,
|
20 |
+
"rank_pattern": {},
|
21 |
+
"revision": null,
|
22 |
+
"target_modules": [
|
23 |
+
"c_attn"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM",
|
26 |
+
"use_dora": false,
|
27 |
+
"use_rslora": false
|
28 |
+
}
|
adapter_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c722715e383637b38937318cbdf0c8876d32e7d71a1ddf555575cc884387449
|
3 |
+
size 1182680
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
runs/May08_11-45-43_180d96a9f229/events.out.tfevents.1715168759.180d96a9f229.6794.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c12eb6ac79078923cca8086c71ccafd15e3a5460bdc5f8f7eb9f6f449f40389
|
3 |
+
size 5003
|
runs/May08_12-20-56_180d96a9f229/events.out.tfevents.1715170862.180d96a9f229.19937.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3f362f4920bd9602d9ae0f8f2d45fabb7e733cbf9f10d5aaf8578fd20b132fe
|
3 |
+
size 5003
|
runs/May08_12-52-04_180d96a9f229/events.out.tfevents.1715172727.180d96a9f229.30545.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc618ce6b172446d19aefcca0eeba1df23035b2c5f6917c86322eb43a885b4d2
|
3 |
+
size 5003
|
runs/May08_12-53-28_180d96a9f229/events.out.tfevents.1715172811.180d96a9f229.30545.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac6ca8193d81b241616a59fe4a1ab94e6139c0f319956de8f6e72c540ab9262c
|
3 |
+
size 5003
|
runs/May12_06-33-01_4b23207d8454/events.out.tfevents.1715495589.4b23207d8454.3581.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fce6d89f2311bc5b0384f916892472ca6d1d58b5e90a06eb2a84bed9950f75d
|
3 |
+
size 5351
|
runs/May12_06-51-56_4b23207d8454/events.out.tfevents.1715496719.4b23207d8454.9272.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d0ef7bdb0beea47eabf6d0525e280d328a22d52854f7105597edcf52a355d47
|
3 |
+
size 5003
|
runs/May12_06-53-10_4b23207d8454/events.out.tfevents.1715496797.4b23207d8454.9272.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5886c79c4cc14871ec47e5338dca8902a7fb090d24c4ed21efcde15c6b9ea8d
|
3 |
+
size 5003
|
runs/May12_08-10-20_4b23207d8454/events.out.tfevents.1715501422.4b23207d8454.9272.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de110cd1074f3ffe657bd387f8ac88e97d45f867f6cf4893a338280cd8c43a7a
|
3 |
+
size 5003
|
runs/May12_08-13-29_4b23207d8454/events.out.tfevents.1715501618.4b23207d8454.9272.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9568c44931c16e3ea2ef82b316973b4fb531eea90d537363a3f9b0455a2310e
|
3 |
+
size 5003
|
runs/May12_08-17-01_4b23207d8454/events.out.tfevents.1715501851.4b23207d8454.9272.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f924bb6eba0ca7204710842c2de53c579ad069ea06df6f6518e14dea1e657c3
|
3 |
+
size 88
|
runs/May14_13-58-28_8639c74b4083/events.out.tfevents.1715695111.8639c74b4083.230.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e773f8fa4a36383764a8e8026122569f4293ecbb823bd42a2eb05506953fe44c
|
3 |
+
size 5003
|
runs/May14_14-02-12_8639c74b4083/events.out.tfevents.1715695337.8639c74b4083.230.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e04cc307705f1417becd52e4bd6243c04ab4928d3acc544e29881f4ee20a1baa
|
3 |
+
size 5003
|
runs/May14_14-30-34_8639c74b4083/events.out.tfevents.1715697046.8639c74b4083.230.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09bbd278d956b2fd1443e053a28dfe1aaeaca0a4dea395981cc65f8278957c11
|
3 |
+
size 5001
|
runs/May14_14-31-25_8639c74b4083/events.out.tfevents.1715697097.8639c74b4083.230.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ef2e972bc7da77092136428195def709f5ce74fa8550104eeb0f6b862f709f4
|
3 |
+
size 5003
|
runs/May14_14-37-45_8639c74b4083/events.out.tfevents.1715697475.8639c74b4083.230.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2b0e0cd7abd8e0f6c0bdd62d7997e9ecd54deb0394612db02c440386b3a1ccb
|
3 |
+
size 5004
|
runs/May14_14-41-32_8639c74b4083/events.out.tfevents.1715697701.8639c74b4083.230.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91c0f9af71abbaa2827dc8a9c8ac76e4b8f3820042988d12e2e3f37d7e406f69
|
3 |
+
size 5835
|
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "<|endoftext|>",
|
3 |
+
"eos_token": "<|endoftext|>",
|
4 |
+
"pad_token": "<|endoftext|>",
|
5 |
+
"unk_token": "<|endoftext|>"
|
6 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"50256": {
|
5 |
+
"content": "<|endoftext|>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": true,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
}
|
12 |
+
},
|
13 |
+
"bos_token": "<|endoftext|>",
|
14 |
+
"clean_up_tokenization_spaces": true,
|
15 |
+
"eos_token": "<|endoftext|>",
|
16 |
+
"model_max_length": 1024,
|
17 |
+
"pad_token": "<|endoftext|>",
|
18 |
+
"tokenizer_class": "GPT2Tokenizer",
|
19 |
+
"unk_token": "<|endoftext|>"
|
20 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c475bf9240d3a39970e5387e50220cc8085838694a2e5598961db41c3f5fb71
|
3 |
+
size 5048
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|