QinLiuNLP
/

llama3-sudo

alignment-handbook

Generated from Trainer

Model card Files Files and versions Metrics Training metrics Community

Qin Liu committed on Aug 13, 2024

Commit

10734f1

·

verified ·

1 Parent(s): d74a4f8

End of training

Files changed (2) hide show

README.md +4 -2
config.json +2 -2

README.md CHANGED Viewed

@@ -1,11 +1,13 @@
 ---
 base_model: meta-llama/Meta-Llama-3-8B
 library_name: peft
 license: llama3
 tags:
 - trl
 - sft
-- alignment-handbook
 - generated_from_trainer
 model-index:
 - name: llama3-sudo
@@ -17,7 +19,7 @@ should probably proofread and complete it, then remove this comment. -->
 # llama3-sudo
-This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.0709

 ---
 base_model: meta-llama/Meta-Llama-3-8B
+datasets:
+- HuggingFaceH4/ultrachat_200k
 library_name: peft
 license: llama3
 tags:
+- alignment-handbook
 - trl
 - sft
 - generated_from_trainer
 model-index:
 - name: llama3-sudo
 # llama3-sudo
+This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on the HuggingFaceH4/ultrachat_200k dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.0709

config.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-  "_name_or_path": "meta-llama/Meta-Llama-3-8B-Instruct",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
-  "eos_token_id": 128009,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,

 {
+  "_name_or_path": "meta-llama/Meta-Llama-3-8B",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
+  "eos_token_id": 128001,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,