File size: 712 Bytes
ece75fb 6087912 ece75fb f0adc7d ece75fb 3eb8262 ece75fb d2e0660 ece75fb 6087912 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 |
# Invoke run_clm_mp.py with both training and evaluation enabled.
#
# The argument vector is accumulated in the positional parameters so that each
# group of flags can carry its own comment. Arguments passed to this script
# itself are not forwarded to python; the list starts out empty.
set --

# Model and tokenizer are loaded from the same directory.
set -- "$@" --model_name_or_path /mnt/disks/flaxdisk/norwegian-gptneo-red/
set -- "$@" --tokenizer_name /mnt/disks/flaxdisk/norwegian-gptneo-red/

# Training and validation data files.
set -- "$@" --train_file /mnt/disks/flaxdisk/corpus/social_train.json
set -- "$@" --validation_file /mnt/disks/flaxdisk/corpus/social_validation.json

# Run both the training and the evaluation phase.
set -- "$@" --do_train --do_eval

# Sequence length, schedule and batch sizes.
set -- "$@" --block_size 1024
set -- "$@" --num_train_epochs 5
set -- "$@" --learning_rate 4e-6
set -- "$@" --per_device_train_batch_size 2
set -- "$@" --per_device_eval_batch_size 2

# Output goes to the current directory, overwriting what is there.
set -- "$@" --overwrite_output_dir --output_dir "./"

# Cache location, preprocessing parallelism and numeric dtype.
set -- "$@" --cache_dir /mnt/disks/flaxdisk/cache/
set -- "$@" --preprocessing_num_workers 96
set -- "$@" --dtype bfloat16

# Logging and evaluation both use a 5000-step interval.
set -- "$@" --logging_steps 5000 --eval_steps 5000

# Hub upload flag.
set -- "$@" --push_to_hub

python run_clm_mp.py "$@"
|