File size: 915 Bytes
dc9ca7d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 |
# Runs test_dpo.py through `accelerate launch` (4 processes, using the
# deepspeed_zero3.yaml accelerate config) and stores the run's artifacts in
# ${output_dir}: a copy of this script plus a log of the launcher's stdout.
#
# The script refuses to start (exit status 1) if ${output_dir} already exists,
# so an earlier run's directory is never written into.

# Abort on the first failing command and on use of an unset variable.
set -eu
# Without pipefail the `accelerate ... | tee` pipeline below would report tee's
# status, so a crashed run would look successful. Some /bin/sh implementations
# do not support the option, hence the probe in a subshell first.
if (set -o pipefail) 2>/dev/null; then
  set -o pipefail
fi

# NCCL overrides, currently left disabled.
# export NCCL_P2P_DISABLE="1"
# export NCCL_IB_DISABLE="1"
export OMP_NUM_THREADS=1
export ACCELERATE_LOG_LEVEL=info
export WANDB_PROJECT='Mistral-DPO'
export WANDB_ENTITY="ckip"

output_dir="DPO/CHT-6_20240715-1255"

# Refuse to reuse an existing output directory. Exit non-zero and report on
# stderr so callers can tell that nothing was launched.
if [ -d "${output_dir}" ]; then
  echo "The directory already exists." >&2
  exit 1
fi
mkdir -p -- "${output_dir}"

# Keep a copy of the exact script that produced this run next to its outputs.
current_script=$0
cp -- "${current_script}" "${output_dir}"

# Only stdout is piped into the log; stderr still goes to the terminal.
# The log file name is kept exactly as originally spelled ("trainin.log").
accelerate launch \
  --config_file alignment-handbook/recipes/accelerate_configs/deepspeed_zero3.yaml \
  --num_processes 4 \
  test_dpo.py \
  "dpo_config_full.yaml" \
  --load_in_4bit=false \
  --logging_steps=1 \
  --model_name_or_path="/share/home/models/CHT-Mistral-7B/CHT-6/" \
  --train_file="data/training_ptt_dpo-include_id-converted.jsonl" \
  --validation_file="data/testing_ptt_dpo_include_id-converted.jsonl" \
  --cache_dir="cache_dir" \
  --output_dir="${output_dir}" \
  | tee -- "${output_dir}/trainin.log"
|