mt5-base-qgen / start_qgen.sh
nbroad's picture
nbroad HF staff
Upload start_qgen.sh
1c58869
#!/usr/bin/env bash
#
# Launch run_summarization_flax.py to fine-tune google/mt5-base, reading the
# `context` column of asdf.csv as the source text and the `question` column
# as the target. Output goes to ./mt5-base-qgen and --push_to_hub is set.
#
# Usage:
#   ./start_qgen.sh [extra run_summarization_flax.py options...]
#
# Extra options are appended after the defaults below, so the training script
# sees them last. Presumably a repeated option then overrides the default
# (usual argparse behaviour) -- confirm against the training script.
#
# Relative paths (the training script, asdf.csv, the output directory) are
# resolved against the current working directory, exactly as before.

set -euo pipefail

train_args=(
  # Model, tokenizer and output location.
  --output_dir ./mt5-base-qgen
  --model_name_or_path google/mt5-base
  --tokenizer_name google/mt5-base

  # Training data and the CSV columns used as source / target.
  # NOTE(review): --pretokenized looks like a local addition to the training
  # script rather than a stock option -- confirm the script accepts it.
  --pretokenized
  --train_file asdf.csv
  --text_column context
  --summary_column question

  # Run both phases.
  # NOTE(review): --do_eval is passed but no validation file is given here;
  # verify the training script can obtain an evaluation split.
  --do_train
  --do_eval

  # Optimisation settings.
  --num_train_epochs 4
  --learning_rate 5e-5
  --warmup_steps 1000
  --dtype bfloat16
  --per_device_train_batch_size 4
  --per_device_eval_batch_size 4

  # Sequence length limits for source and target.
  --max_source_length 1024
  --max_target_length 64

  # Output handling.
  --overwrite_output_dir
  --push_to_hub
)

# Defaults first, caller-supplied options last.
python run_summarization_flax.py "${train_args[@]}" "$@"