crystina-z
committed on
Commit
·
8071540
1
Parent(s):
5edd862
Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Tevatron
|
2 |
+
|
3 |
+
```
|
4 |
+
bs=512
|
5 |
+
epoch=40
|
6 |
+
|
7 |
+
save_steps=4000
|
8 |
+
backbone=bert-base-multilingual-cased
|
9 |
+
output_dir=mlm.bs-$bs.epoch-$epoch.$backbone
|
10 |
+
|
11 |
+
WANDB_PROJECT=mlm-mrtydi-DDR \
|
12 |
+
python examples/dense-adapter/dense-adapter-train.py \
|
13 |
+
--output_dir $output_dir \
|
14 |
+
--model_name_or_path $backbone \
|
15 |
+
--tokenizer_name bert-base-multilingual-cased \
|
16 |
+
--save_steps $save_steps \
|
17 |
+
--dataset_name Tevatron/msmarco-passage \
|
18 |
+
--fp16 \
|
19 |
+
--per_device_train_batch_size $bs \
|
20 |
+
--train_n_passages 2 \
|
21 |
+
--learning_rate 1e-5 \
|
22 |
+
--q_max_len 32 \
|
23 |
+
--p_max_len 128 \
|
24 |
+
--num_train_epochs $epoch \
|
25 |
+
--logging_steps 100 \
|
26 |
+
--overwrite_output_dir \
|
27 |
+
--dataloader_num_workers 4
|
28 |
+
```
|