File size: 618 Bytes
e565538 ebb3343 e565538 ebb3343 e565538 ebb3343 e565538 ebb3343 e565538 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
# Launches run_dnlm_flax.py (expected in the current working directory) with a
# fixed set of command-line flags.
#
# The flags are accumulated in the positional parameters with `set --` so they
# can be grouped and commented; a single backslash-continued command cannot
# contain comments. Any arguments passed to this script itself are discarded,
# exactly as before. The flag order is unchanged.
#
# NOTE(review): the group labels below are inferred from the flag names only;
# confirm exact semantics against run_dnlm_flax.py's argument parser.

# Output location: write into the current directory, overwriting it.
set -- \
  --output_dir "." \
  --overwrite_output_dir

# Dataset, model configuration and tokenizer inputs.
set -- "$@" \
  --dataset_path NbAiLab/NCC2 \
  --config_name rotobart \
  --tokenizer_name vocab-2/the_pile.model \
  --shuffle_buffer_size 100_000

# Run both the training and the evaluation phases.
set -- "$@" \
  --do_train --do_eval

# Sequence length and encoder/decoder layer counts.
set -- "$@" \
  --max_seq_length 1024 \
  --encoder_layers 12 \
  --decoder_layers 12

# Per-device batch sizes.
set -- "$@" \
  --per_device_train_batch_size 1 \
  --per_device_eval_batch_size 1

# Step-based schedule: logging, total steps, eval/save cadence, warmup.
set -- "$@" \
  --logging_steps 8 \
  --num_train_steps 100000 \
  --eval_steps 10000 \
  --save_steps 10000 \
  --num_eval_samples 500 \
  --warmup_steps 5000

# Learning rate.
set -- "$@" \
  --learning_rate 1e-4

# Authentication and checkpoint strategy.
# NOTE(review): `--auth_token True` presumably enables stored hub credentials
# for the dataset above; verify against the training script.
set -- "$@" \
  --auth_token True \
  --save_strategy steps

# Precision flag. This is the last argument: no trailing line continuation, so
# nothing that follows this block can be spliced into the command.
set -- "$@" \
  --use_bf16

python3 run_dnlm_flax.py "$@"
|