#!/usr/bin/env bash
#
# Launches run_summarization_flax.py with --do_train and --do_eval, starting
# from the google/mt5-base model and tokenizer. The "context" column of the
# training CSV is passed as the text column and the "question" column as the
# summary column; the output directory is ./mt5-base-qgen.
#
# Usage: run from the directory that contains run_summarization_flax.py.
#
# NOTE(review): --do_eval is set but no validation file is passed; confirm
#   the training script can evaluate with only --train_file.
# NOTE(review): --pretokenized is presumably a flag added by a local copy of
#   the training script; verify it is accepted by the version in use.
# NOTE(review): asdf.csv looks like a placeholder file name; confirm.

# Abort on command failure, unset variables, or a failing pipeline stage.
set -euo pipefail

# Each backslash must be the very last character on its line so that the
# options below are joined into a single python command.
python run_summarization_flax.py \
  --output_dir ./mt5-base-qgen \
  --model_name_or_path google/mt5-base \
  --tokenizer_name google/mt5-base \
  --pretokenized \
  --train_file asdf.csv \
  --text_column context \
  --summary_column question \
  --do_train \
  --do_eval \
  --num_train_epochs 4 \
  --learning_rate 5e-5 --warmup_steps 1000 \
  --dtype bfloat16 \
  --per_device_train_batch_size 4 \
  --per_device_eval_batch_size 4 \
  --overwrite_output_dir \
  --max_source_length 1024 \
  --max_target_length 64 \
  --push_to_hub