File size: 714 Bytes
ece75fb
6087912
 
 
 
ece75fb
 
 
f0adc7d
ece75fb
3eb8262
 
ece75fb
d2e0660
ece75fb
6087912
 
07f4ae9
 
6087912
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Launch run_clm_mp.py with both --do_train and --do_eval, using the
# social_train.json / social_validation.json files as train and validation input.
#
# Each filesystem location is named once here. The same directory is passed
# as both --model_name_or_path and --tokenizer_name.
model_dir=/mnt/disks/flaxdisk/norwegian-gptneo-red/
train_json=/mnt/disks/flaxdisk/corpus/social_train.json
validation_json=/mnt/disks/flaxdisk/corpus/social_validation.json
cache_dir=/mnt/disks/flaxdisk/cache/

# NOTE(review): --output_dir is the current working directory and
# --overwrite_output_dir is set, together with --push_to_hub; confirm the
# script is started from the intended directory.
python run_clm_mp.py \
  --model_name_or_path "${model_dir}" \
  --tokenizer_name "${model_dir}" \
  --train_file "${train_json}" \
  --validation_file "${validation_json}" \
  --do_train \
  --do_eval \
  --block_size 1024 \
  --num_train_epochs 5 \
  --learning_rate 4e-6 \
  --per_device_train_batch_size 2 \
  --per_device_eval_batch_size 2 \
  --overwrite_output_dir \
  --output_dir "./" \
  --cache_dir "${cache_dir}" \
  --preprocessing_num_workers 96 \
  --dtype bfloat16 \
  --logging_steps 50000 \
  --eval_steps 50000 \
  --push_to_hub