crystina-z committed on
Commit
8071540
1 Parent(s): 5edd862

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +28 -0
README.md ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Tevatron
2
+
3
+ ```
4
+ bs=512
5
+ epoch=40
6
+
7
+ save_steps=4000
8
+ backbone=bert-base-multilingual-cased
9
+ output_dir=mlm.bs-$bs.epoch-$epoch.$backbone
10
+
11
+ WANDB_PROJECT=mlm-mrtydi-DDR \
12
+ python examples/dense-adapter/dense-adapter-train.py \
13
+ --output_dir $output_dir \
14
+ --model_name_or_path $backbone \
15
+ --tokenizer_name bert-base-multilingual-cased \
16
+ --save_steps $save_steps \
17
+ --dataset_name Tevatron/msmarco-passage \
18
+ --fp16 \
19
+ --per_device_train_batch_size $bs \
20
+ --train_n_passages 2 \
21
+ --learning_rate 1e-5 \
22
+ --q_max_len 32 \
23
+ --p_max_len 128 \
24
+ --num_train_epochs $epoch \
25
+ --logging_steps 100 \
26
+ --overwrite_output_dir \
27
+ --dataloader_num_workers 4
28
+ ```