File size: 516 Bytes
32dc2d8
a96f44d
5ca30e6
a96f44d
5ca30e6
 
a96f44d
32dc2d8
5ca30e6
 
650ecb1
3cccb01
650ecb1
32dc2d8
 
650ecb1
 
074c5e1
63249ac
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Launch run_seq2seq_flax.py with training and evaluation enabled
# (--do_train / --do_eval), using the Adafactor flag and a streaming dataset
# taken from dalle-mini/encoded.
#
# The --train_file / --validation_file values are glob PATTERNS and are
# single-quoted on purpose: unquoted, the invoking shell would try to expand
# them against the current working directory before Python ever starts. A
# local match would turn one pattern into several path arguments, and with
# nullglob/failglob enabled the value would vanish or abort the command.
# NOTE(review): presumably the script resolves these patterns relative to
# --dataset_repo_or_path; confirm against run_seq2seq_flax.py.
python run_seq2seq_flax.py \
	--dataset_repo_or_path dalle-mini/encoded \
	--train_file '**/train/CC3M/*.jsonl' \
	--validation_file '**/valid/*/*.jsonl' \
	--len_train 129847128 \
	--len_eval 157312 \
	--streaming \
	--output_dir output \
	--per_device_train_batch_size 16 \
	--per_device_eval_batch_size 16 \
	--preprocessing_num_workers 80 \
	--warmup_steps 125 \
	--gradient_accumulation_steps 8 \
	--do_train \
	--do_eval \
	--adafactor \
	--num_train_epochs 1 \
	--max_train_samples 10000 \
	--learning_rate 0.005