Update albert_xxlargev1_sqd2_512.sh
Browse files- albert_xxlargev1_sqd2_512.sh +34 -0
albert_xxlargev1_sqd2_512.sh
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#!/bin/bash
#
# Fine-tune and evaluate albert-xxlarge-v1 on SQuAD 2.0 with a maximum
# sequence length of 512, using the run_squad.py example script.
#
# Usage: albert_xxlargev1_sqd2_512.sh [extra run_squad.py arguments...]
#
# Any arguments given to this script are appended to the run_squad.py
# command line, so they can add to the options set below.
#
# NOTE(review): the paths below are machine-specific absolute paths; adjust
# EXAMPLES before running on another host.

set -euo pipefail

# Thread count exported for OpenMP; kept equal to --threads below.
export OMP_NUM_THREADS=12

EXAMPLES=/media/dn/work2/nlpu/transformers/examples
SQUAD="${EXAMPLES}/scripts/squad2.0"
MODEL_PATH="${EXAMPLES}/scripts/runs/albert_xxlargev1_squad2_512_bs48_3ep_fp16"

# Per-GPU train batch 6 x gradient accumulation 8 = 48, matching the "bs48"
# in the output directory name.
# NOTE(review): both --num_train_epochs and --max_steps are passed; in the
# transformers example script a positive --max_steps presumably takes
# precedence over the epoch count -- confirm against run_squad.py.
python "${EXAMPLES}/question-answering/run_squad.py" \
  --model_type albert \
  --model_name_or_path albert-xxlarge-v1 \
  --do_train \
  --do_eval \
  --train_file "${SQUAD}/train-v2.0.json" \
  --predict_file "${SQUAD}/dev-v2.0.json" \
  --version_2_with_negative \
  --do_lower_case \
  --num_train_epochs 3 \
  --max_steps 8144 \
  --warmup_steps 814 \
  --learning_rate 3e-5 \
  --max_seq_length 512 \
  --doc_stride 128 \
  --per_gpu_train_batch_size 6 \
  --gradient_accumulation_steps 8 \
  --per_gpu_eval_batch_size 48 \
  --fp16 \
  --fp16_opt_level O1 \
  --threads 12 \
  --logging_steps 50 \
  --save_steps 3000 \
  --overwrite_output_dir \
  --output_dir "${MODEL_PATH}" \
  "$@"
|
34 |
+
|