Training in progress, step 50
Browse files- adapter_config.json +34 -0
- adapter_model.safetensors +3 -0
- runs/Feb17_11-37-15_gpu3/events.out.tfevents.1739792277.gpu3.128186.0 +3 -0
- runs/Feb17_11-43-05_gpu3/events.out.tfevents.1739792594.gpu3.129620.0 +3 -0
- runs/Feb18_13-15-53_gpu3/events.out.tfevents.1739884560.gpu3.146287.0 +3 -0
- runs/Feb18_13-16-30_gpu3/events.out.tfevents.1739884598.gpu3.146287.1 +3 -0
- runs/Feb18_14-21-25_gpu3/events.out.tfevents.1739888488.gpu3.150125.0 +3 -0
- runs/Feb18_14-22-35_gpu3/events.out.tfevents.1739888558.gpu3.150383.0 +3 -0
- training_args.bin +3 -0
adapter_config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"alpha_pattern": {},
|
3 |
+
"auto_mapping": null,
|
4 |
+
"base_model_name_or_path": "bigcode/starcoderbase-3b",
|
5 |
+
"bias": "none",
|
6 |
+
"eva_config": null,
|
7 |
+
"exclude_modules": null,
|
8 |
+
"fan_in_fan_out": false,
|
9 |
+
"inference_mode": true,
|
10 |
+
"init_lora_weights": true,
|
11 |
+
"layer_replication": null,
|
12 |
+
"layers_pattern": null,
|
13 |
+
"layers_to_transform": null,
|
14 |
+
"loftq_config": {},
|
15 |
+
"lora_alpha": 16,
|
16 |
+
"lora_bias": false,
|
17 |
+
"lora_dropout": 0.0,
|
18 |
+
"megatron_config": null,
|
19 |
+
"megatron_core": "megatron.core",
|
20 |
+
"modules_to_save": null,
|
21 |
+
"peft_type": "LORA",
|
22 |
+
"r": 4,
|
23 |
+
"rank_pattern": {},
|
24 |
+
"revision": null,
|
25 |
+
"target_modules": [
|
26 |
+
"q_attn",
|
27 |
+
"c_proj",
|
28 |
+
"c_fc",
|
29 |
+
"c_attn"
|
30 |
+
],
|
31 |
+
"task_type": "CAUSAL_LM",
|
32 |
+
"use_dora": false,
|
33 |
+
"use_rslora": false
|
34 |
+
}
|
adapter_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db1a24d5c9a74ffe3f9ffb0aac041c8ce6da225e9011d318ef3bf4666f698b4e
|
3 |
+
size 22892576
|
runs/Feb17_11-37-15_gpu3/events.out.tfevents.1739792277.gpu3.128186.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0f34c0ac3268c6a2a5ef2cb31299c5c78cf9297c662d69ad79b318084b93c01
|
3 |
+
size 4184
|
runs/Feb17_11-43-05_gpu3/events.out.tfevents.1739792594.gpu3.129620.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f7a8667b7190cab407b2a784415a77aefb83dc5bf2745cc87c89d7766fbe4fd
|
3 |
+
size 5652
|
runs/Feb18_13-15-53_gpu3/events.out.tfevents.1739884560.gpu3.146287.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fac3bf60f7934eaeb62c72c0ebaf673330f541e4cb69c1277f2f9cb33b7fbb2
|
3 |
+
size 5652
|
runs/Feb18_13-16-30_gpu3/events.out.tfevents.1739884598.gpu3.146287.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d58832c7405d4f9ca6ae1eba2969237e700041d29e05b19a8e13d23b8c8d073
|
3 |
+
size 5652
|
runs/Feb18_14-21-25_gpu3/events.out.tfevents.1739888488.gpu3.150125.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:350e1d72c4e34c695c268dfde44b8a5c82942650f05d0458c1c80a0a59f8b180
|
3 |
+
size 4184
|
runs/Feb18_14-22-35_gpu3/events.out.tfevents.1739888558.gpu3.150383.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a374a8acb75436ade461e245f4c0748266dbf4bac1d24fc9295b13d10a0218
|
3 |
+
size 6759
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b199eb3f42b0b628b1bba35888769aff274eb6b3aaca151bc4400e5f110ea759
|
3 |
+
size 5304
|