Commit dab24b4 by dh-mc · Parent: 1c6f4f0

r3: hfl/llama-3-chinese-8b-instruct-v3

competition/00d_Llama3_Results.ipynb ADDED
The diff for this file is too large to render.

competition/11b_Llama-3_8b_p1_en_analysis.ipynb ADDED
The diff for this file is too large to render.

competition/11b_Llama-3_8b_p2_en_analysis.ipynb ADDED
The diff for this file is too large to render.

llama-factory/config/llama3-8b_lora_sft_bf16-p1_r3.yaml ADDED
@@ -0,0 +1,46 @@
+ ### model
+ model_name_or_path: hfl/llama-3-chinese-8b-instruct-v3
+
+ ### method
+ stage: sft
+ do_train: true
+ finetuning_type: lora
+ lora_target: all
+ # quantization_bit: 4 # use 4-bit QLoRA
+ loraplus_lr_ratio: 16.0 # use LoRA+ with lambda=16.0
+ # use_unsloth: true # use UnslothAI's LoRA optimization for 2x faster training
+ upcast_layernorm: true
+
+ ### dataset
+ dataset: alpaca_mgtv_p1
+ template: llama3
+ cutoff_len: 4096
+ max_samples: 25000
+ overwrite_cache: true
+ preprocessing_num_workers: 16
+
+ ### output
+ output_dir: saves/llama3-8b/lora/sft_bf16_p1_full_r3
+ logging_steps: 10
+ save_steps: 35
+ plot_loss: true
+ # overwrite_output_dir: true
+
+ ### train
+ per_device_train_batch_size: 16
+ gradient_accumulation_steps: 8
+ learning_rate: 1.0e-4
+ num_train_epochs: 1.0
+ lr_scheduler_type: cosine
+ warmup_ratio: 0.1
+ bf16: true
+ ddp_timeout: 180000000
+
+ ### eval
+ val_size: 0.1
+ per_device_eval_batch_size: 1
+ eval_strategy: steps
+ eval_steps: 35
+
+ report_to: wandb
+ run_name: llama3_8b_p1_full_r3 # optional
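
Note (not part of the commit): a config like the one above is normally handed to LLaMA-Factory's CLI; the scripts/tune-lf.sh wrapper used further down presumably does the equivalent of the sketch below. The working directory and the lack of explicit GPU selection are assumptions here, not taken from the diff:

    # assumed invocation; the committed entry point is scripts/tune-mgtv-llama3_8b.sh
    cd llama-factory
    llamafactory-cli train config/llama3-8b_lora_sft_bf16-p1_r3.yaml   # LoRA+ SFT on alpaca_mgtv_p1
    llamafactory-cli train config/llama3-8b_lora_sft_bf16-p2_r3.yaml   # same recipe on alpaca_mgtv_p2 (config below)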
llama-factory/config/llama3-8b_lora_sft_bf16-p2_r3.yaml ADDED
@@ -0,0 +1,46 @@
+ ### model
+ model_name_or_path: hfl/llama-3-chinese-8b-instruct-v3
+
+ ### method
+ stage: sft
+ do_train: true
+ finetuning_type: lora
+ lora_target: all
+ # quantization_bit: 4 # use 4-bit QLoRA
+ loraplus_lr_ratio: 16.0 # use LoRA+ with lambda=16.0
+ # use_unsloth: true # use UnslothAI's LoRA optimization for 2x faster training
+ upcast_layernorm: true
+
+ ### dataset
+ dataset: alpaca_mgtv_p2
+ template: llama3
+ cutoff_len: 4096
+ max_samples: 25000
+ overwrite_cache: true
+ preprocessing_num_workers: 16
+
+ ### output
+ output_dir: saves/llama3-8b/lora/sft_bf16_p2_full_r3
+ logging_steps: 10
+ save_steps: 35
+ plot_loss: true
+ # overwrite_output_dir: true
+
+ ### train
+ per_device_train_batch_size: 16
+ gradient_accumulation_steps: 8
+ learning_rate: 1.0e-4
+ num_train_epochs: 1.0
+ lr_scheduler_type: cosine
+ warmup_ratio: 0.1
+ bf16: true
+ ddp_timeout: 180000000
+
+ ### eval
+ val_size: 0.1
+ per_device_eval_batch_size: 1
+ eval_strategy: steps
+ eval_steps: 35
+
+ report_to: wandb
+ run_name: llama3_8b_p2_full_r3 # optional
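
The p2 config above differs from the p1 config only in dataset (alpaca_mgtv_p2), output_dir and run_name; all training hyperparameters are identical. In both, per_device_train_batch_size=16 with gradient_accumulation_steps=8 gives an effective batch size of 16 × 8 = 128 per device (times however many GPUs the launcher uses, which the config does not pin), and save_steps and eval_steps are both 35, so every saved checkpoint has a matching eval point.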
results/mgtv-llama3_p1_en_full_metrics.csv ADDED
@@ -0,0 +1,4 @@
+ epoch,model,accuracy,precision,recall,f1
+ 0.3333333333333333,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-117_torch.bfloat16_lf,0.6486666666666666,0.6525934632970077,0.6486666666666666,0.6312721163517108
+ 0.6666666666666666,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-234_torch.bfloat16_lf,0.561,0.6897096276142071,0.561,0.6083393704375663
+ 1.0,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-351_torch.bfloat16_lf,0.621,0.686842945161901,0.621,0.6417441253605001
results/mgtv-llama3_p2_en_full_metrics.csv ADDED
@@ -0,0 +1,4 @@
+ epoch,model,accuracy,precision,recall,f1
+ 0.3333333333333333,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-117_torch.bfloat16_lf,0.6203333333333333,0.663582082981778,0.6203333333333333,0.6363626392286635
+ 0.6666666666666666,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-234_torch.bfloat16_lf,0.5613333333333334,0.7000506187405509,0.5613333333333334,0.6113039056178092
+ 1.0,meta-llama/Meta-Llama-3-8B-Instruct/checkpoint-351_torch.bfloat16_lf,0.6203333333333333,0.6819200833733873,0.6203333333333333,0.6405153767205392
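
Both metrics files share the schema shown above (epoch, model, accuracy, precision, recall, f1; one row per evaluated checkpoint). A throwaway one-liner, not added by this commit, for pulling the best-f1 row out of each file, assuming f1 stays in column 6:

    for f in results/mgtv-llama3_p1_en_full_metrics.csv results/mgtv-llama3_p2_en_full_metrics.csv; do
        echo "$f"; tail -n +2 "$f" | sort -t, -k6 -gr | head -n 1
    done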
scripts/eval-mgtv-llama3_8b.sh CHANGED
@@ -21,17 +21,19 @@ export RESIZE_TOKEN_EMBEDDINGS=true
  export START_EPOCH=0
  export USING_LLAMA_FACTORY=true

- export MODEL_NAME=shenzhi-wang/Llama3-8B-Chinese-Chat
+ # export MODEL_NAME=shenzhi-wang/Llama3-8B-Chinese-Chat
+ export MODEL_NAME=hfl/llama-3-chinese-8b-instruct-v3
+
  export MODEL_PREFIX=llama3-8b_lora_sft_bf16

- export LOGICAL_REASONING_RESULTS_PATH=results/$MODEL_PREFIX-p1_r2.csv
- export ADAPTER_PATH_BASE=llama-factory/saves/llama3-8b/lora/sft_bf16_p1_full_r2
+ export LOGICAL_REASONING_RESULTS_PATH=results/$MODEL_PREFIX-p1_r3.csv
+ export ADAPTER_PATH_BASE=llama-factory/saves/llama3-8b/lora/sft_bf16_p1_full_r3
  export USING_P1_PROMPT_TEMPLATE=true
  echo "Eval $MODEL_NAME with $ADAPTER_PATH_BASE"
  python llm_toolkit/eval_logical_reasoning_all_epochs.py

- export LOGICAL_REASONING_RESULTS_PATH=results/$MODEL_PREFIX-p2_r2.csv
- export ADAPTER_PATH_BASE=llama-factory/saves/llama3-8b/lora/sft_bf16_p2_full_r2
+ export LOGICAL_REASONING_RESULTS_PATH=results/$MODEL_PREFIX-p2_r3.csv
+ export ADAPTER_PATH_BASE=llama-factory/saves/llama3-8b/lora/sft_bf16_p2_full_r3
  export USING_P1_PROMPT_TEMPLATE=false
  echo "Eval $MODEL_NAME with $ADAPTER_PATH_BASE"
  python llm_toolkit/eval_logical_reasoning_all_epochs.py
scripts/tune-mgtv-llama3_8b.sh CHANGED
@@ -25,12 +25,12 @@ export MODEL_NAME=shenzhi-wang/Llama3-8B-Chinese-Chat

  export MODEL_PREFIX=llama3-8b_lora_sft_bf16

- export CONFIG_FILE=config/$MODEL_PREFIX-p1_r2.yaml
+ export CONFIG_FILE=config/$MODEL_PREFIX-p1_r3.yaml
  echo "Tuning $MODEL_NAME with $CONFIG_FILE"
  $BASEDIR/scripts/tune-lf.sh $CONFIG_FILE


- export CONFIG_FILE=config/$MODEL_PREFIX-p2_r2.yaml
+ export CONFIG_FILE=config/$MODEL_PREFIX-p2_r3.yaml
  echo "Tuning $MODEL_NAME with $CONFIG_FILE"
  $BASEDIR/scripts/tune-lf.sh $CONFIG_FILE
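
Taken together, the round-3 flow implied by this commit is the following; the exact environment setup is outside this diff and assumed here:

    scripts/tune-mgtv-llama3_8b.sh   # fine-tunes with config/llama3-8b_lora_sft_bf16-p{1,2}_r3.yaml
                                     # checkpoints land in llama-factory/saves/llama3-8b/lora/sft_bf16_p{1,2}_full_r3
    scripts/eval-mgtv-llama3_8b.sh   # evaluates each checkpoint of hfl/llama-3-chinese-8b-instruct-v3
                                     # and writes results/llama3-8b_lora_sft_bf16-p{1,2}_r3.csv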