mt5-small-qgen / start_qgen.sh
nbroad's picture
nbroad HF staff
Saving weights and logs of epoch 0
1455619
#!/usr/bin/env bash
#
# Launch run_summarization_flax.py to fine-tune google/mt5-small on
# qgen_train.csv / qgen_val.csv, using the `context` column as input text and
# the `question` column as the target.
#
# Usage:
#   start_qgen.sh [extra arguments for run_summarization_flax.py ...]
#
# Every path below is relative, so run this from the directory that holds
# run_summarization_flax.py and the two CSV files. Outputs are written to the
# current directory (--output_dir ./ together with --overwrite_output_dir).
#
# Extra arguments are appended after the defaults. With no extra arguments the
# command line is exactly the default set below.
# NOTE(review): whether a repeated flag overrides the earlier default depends
# on the training script's argument parser -- confirm before relying on it.

set -euo pipefail

# Flags live in an array rather than a backslash-continued command so that a
# missing continuation character cannot silently truncate the invocation.
train_args=(
  --output_dir ./
  --model_name_or_path google/mt5-small
  --tokenizer_name google/mt5-small
  --train_file qgen_train.csv
  --validation_file qgen_val.csv
  --text_column context
  --summary_column question
  --do_train
  --do_eval
  --num_train_epochs 3
  --eval_steps 2000
  --logging_steps 100
  --learning_rate 5e-5
  --warmup_steps 1000
  --per_device_train_batch_size 2
  --per_device_eval_batch_size 2
  --overwrite_output_dir
  --max_source_length 1024
  --max_target_length 64
  # NOTE(review): presumably uploads results to the Hugging Face Hub and so
  # needs credentials configured -- confirm against the training script.
  --push_to_hub
)

python run_summarization_flax.py "${train_args[@]}" "$@"