Qin Liu committed on
Commit
d0cb34d
1 Parent(s): eb31b09

Training in progress, step 75

Browse files
README.md CHANGED
@@ -1,11 +1,13 @@
1
  ---
2
  base_model: meta-llama/Meta-Llama-3-8B
 
 
3
  library_name: peft
4
  license: llama3
5
  tags:
 
6
  - trl
7
  - sft
8
- - alignment-handbook
9
  - generated_from_trainer
10
  model-index:
11
  - name: llama3-sudo
@@ -17,7 +19,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  # llama3-sudo
19
 
20
- This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on an unknown dataset.
21
  It achieves the following results on the evaluation set:
22
  - Loss: 1.0709
23
 
 
1
  ---
2
  base_model: meta-llama/Meta-Llama-3-8B
3
+ datasets:
4
+ - HuggingFaceH4/ultrachat_200k
5
  library_name: peft
6
  license: llama3
7
  tags:
8
+ - alignment-handbook
9
  - trl
10
  - sft
 
11
  - generated_from_trainer
12
  model-index:
13
  - name: llama3-sudo
 
19
 
20
  # llama3-sudo
21
 
22
+ This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on the HuggingFaceH4/ultrachat_200k dataset.
23
  It achieves the following results on the evaluation set:
24
  - Loss: 1.0709
25
 
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "k_proj",
24
  "down_proj",
25
- "o_proj",
26
- "q_proj",
27
  "v_proj",
28
  "gate_proj",
29
- "up_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "down_proj",
 
 
24
  "v_proj",
25
  "gate_proj",
26
+ "q_proj",
27
+ "up_proj",
28
+ "o_proj",
29
+ "k_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c5d3d6ecfbbafb1f7f9d5d5266e75a74558d41cf12a70edea301f2ebb05a32f
3
  size 31516744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad134c422e64503fd2453b15cbc3b5282376314193c5b72ae709ebc8d1d8cb7
3
  size 31516744
runs/Aug13_19-05-34_ip-172-31-10-237/events.out.tfevents.1723575945.ip-172-31-10-237.662759.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0a2e9501d49f2d39c1fe0716f1be50b5989245fe1dcc36ac2a948563b50e9f9
3
+ size 5758
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef2cf294a0941096dc386e43b0615197a851de050108383ef1b8c57a6788d26a
3
  size 6904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c99b33a61873ee90046c0f4b37c5fbe4914334128aec99b883a988415fb7ab5f
3
  size 6904