Bingsu committed on
Commit
4986591
1 Parent(s): 15dbab9

Update train.sh

Browse files
Files changed (1) hide show
  1. train.sh +6 -5
train.sh CHANGED
@@ -1,9 +1,12 @@
 
 
1
  python run_mlm.py \
2
  --model_name_or_path Bingsu/my_mobilebert_untrained \
3
- --dataset_name Bingsu/my-korean-training-corpus-half \
 
4
  --per_device_train_batch_size 16 \
5
  --per_device_eval_batch_size 16 \
6
- --gradient_accumulation_steps 16 \
7
  --max_steps 1000000 \
8
  --lr_scheduler_type cosine_with_restarts \
9
  --warmup_ratio 0.05 \
@@ -17,6 +20,4 @@ python run_mlm.py \
17
  --push_to_hub \
18
  --hub_strategy checkpoint \
19
  --output_dir mobilebert_ko \
20
- --overwrite_output_dir \
21
- --gradient_checkpointing \
22
- --use_auth_token
 
1
+ export HF_DATASETS_CACHE="/workspace/.cache/huggingface/datasets"
2
+
3
  python run_mlm.py \
4
  --model_name_or_path Bingsu/my_mobilebert_untrained \
5
+ --train_file train.txt \
6
+ --validation_file val.txt \
7
  --per_device_train_batch_size 16 \
8
  --per_device_eval_batch_size 16 \
9
+ --gradient_accumulation_steps 2 \
10
  --max_steps 1000000 \
11
  --lr_scheduler_type cosine_with_restarts \
12
  --warmup_ratio 0.05 \
 
20
  --push_to_hub \
21
  --hub_strategy checkpoint \
22
  --output_dir mobilebert_ko \
23
+ --overwrite_output_dir