mt5-small-qgen / start_qgen.sh
nbroad's picture
nbroad HF staff
Upload start_qgen.sh
d816f2e
raw
history blame
No virus
485 Bytes
# Launch run_summarization_flax.py to train google/mt5-base on
# qgen_training_data.csv, using the "context" column as the source text and
# the "question" column as the target. Output goes to ./mt5-base-qgen.
#
# The whole invocation is ONE command: every option line except the last must
# end with a backslash. A missing backslash silently ends the command there and
# makes the shell try to execute the next line ("--some_flag ...") as a
# separate program, so the remaining options never reach the Python script.
# Comments cannot be interleaved with continued lines, hence the notes here.
#
# NOTE(review): --per_device_eval_batch_size is passed but no --do_eval flag
# is present; confirm whether evaluation was intended.
python run_summarization_flax.py \
  --output_dir ./mt5-base-qgen \
  --model_name_or_path google/mt5-base \
  --tokenizer_name google/mt5-base \
  --train_file qgen_training_data.csv \
  --text_column context \
  --summary_column question \
  --do_train \
  --num_train_epochs 3 \
  --learning_rate 5e-5 --warmup_steps 300 \
  --per_device_train_batch_size 2 \
  --per_device_eval_batch_size 2 \
  --overwrite_output_dir \
  --max_source_length 1024 --max_target_length 64 \
  --push_to_hub