Chuanming
/

Mixtral-QLoRA-test

Mixtral-QLoRA-test / benchmark /benchmark_level2.sh

Upload folder using huggingface_hub

fa4458a about 1 year ago

1.25 kB

	# Compound experiment: gpt2-xl + gradient accumulation.
	#
	# The training command handed to the benchmark launcher is assembled one
	# option per line so each PPO setting can be read (and diffed) on its own.
	# The resulting string is passed as a single --command argument.
	gpt2xl_cmd="python examples/scripts/ppo.py"
	gpt2xl_cmd="${gpt2xl_cmd} --ppo_config.exp_name ppo_gpt2xl_grad_accu"
	gpt2xl_cmd="${gpt2xl_cmd} --ppo_config.model_name gpt2-xl"
	gpt2xl_cmd="${gpt2xl_cmd} --ppo_config.mini_batch_size 16"
	gpt2xl_cmd="${gpt2xl_cmd} --ppo_config.gradient_accumulation_steps 8"
	gpt2xl_cmd="${gpt2xl_cmd} --ppo_config.log_with wandb"

	# Launch via benchmark/benchmark.py: 3 seeds starting at seed 1, with the
	# Slurm resource request of 1 node / 1 task / 1 GPU per task / 12 CPUs.
	# NOTE(review): presumably benchmark.py fills in the Slurm template and
	# submits one job per seed - confirm against benchmark/benchmark.py.
	python benchmark/benchmark.py \
		--command "${gpt2xl_cmd}" \
		--num-seeds 3 --start-seed 1 \
		--workers 10 \
		--slurm-nodes 1 --slurm-gpus-per-task 1 --slurm-ntasks 1 \
		--slurm-total-cpus 12 \
		--slurm-template-path benchmark/trl.slurm_template

	# Compound experiment: Cerebras-GPT-6.7B + DeepSpeed ZeRO stage 2 + grad_accu.
	#
	# The training command is started through `accelerate launch` with the
	# deepspeed_zero2.yaml accelerate config. It is assembled one option per
	# line and passed to the benchmark launcher as a single --command argument.
	# NOTE(review): the experiment name contains "grad_accu", but no
	# --ppo_config.gradient_accumulation_steps flag is passed here (batch_size
	# and mini_batch_size are both 32) - confirm this is intentional.
	cerebras_cmd="accelerate launch"
	cerebras_cmd="${cerebras_cmd} --config_file examples/accelerate_configs/deepspeed_zero2.yaml"
	cerebras_cmd="${cerebras_cmd} examples/scripts/ppo.py"
	cerebras_cmd="${cerebras_cmd} --ppo_config.exp_name ppo_Cerebras-GPT-6.7B_grad_accu_deepspeed_stage2"
	cerebras_cmd="${cerebras_cmd} --ppo_config.batch_size 32"
	cerebras_cmd="${cerebras_cmd} --ppo_config.mini_batch_size 32"
	cerebras_cmd="${cerebras_cmd} --ppo_config.log_with wandb"
	cerebras_cmd="${cerebras_cmd} --ppo_config.model_name cerebras/Cerebras-GPT-6.7B"
	cerebras_cmd="${cerebras_cmd} --ppo_config.reward_model sentiment-analysis:cerebras/Cerebras-GPT-6.7B"

	# Launch via benchmark/benchmark.py: 3 seeds starting at seed 1, with the
	# Slurm resource request of 1 node / 1 task / 8 GPUs per task / 90 CPUs.
	python benchmark/benchmark.py \
		--command "${cerebras_cmd}" \
		--num-seeds 3 --start-seed 1 \
		--workers 10 \
		--slurm-nodes 1 --slurm-gpus-per-task 8 --slurm-ntasks 1 \
		--slurm-total-cpus 90 \
		--slurm-template-path benchmark/trl.slurm_template