t5-small-nl24-finnish / small_nl24_pretrain.gin
aapot's picture
Try avoid hf hub git rate limits
09eb1bf
# Register necessary SeqIO Tasks/Mixtures.
from __gin__ import dynamic_registration
from t5x import utils
import tasks
import __main__ as train_script
include 'small_nl24.gin'
include 't5x/configs/runs/pretrain.gin'
# ------------------- Training specification overrides --------------------------
# Evaluation cadence of the training loop.
train_script.train:
  # Number of training steps between evaluation passes.
  eval_period = 10000

# Checkpoint-saving policy (see t5x.utils.SaveCheckpointConfig).
utils.SaveCheckpointConfig:
  # Number of training steps between checkpoint writes; kept equal to
  # eval_period above.
  period = 10000
  # Number of checkpoints to retain.
  # NOTE(review): per the T5X docs these are the most recent ones -- confirm.
  keep = 10

# Top-level macros. Presumably referenced as %NAME by the included base
# configs ('small_nl24.gin', 't5x/configs/runs/pretrain.gin') -- verify there.

# Name of the SeqIO Task or Mixture to pretrain on.
# NOTE(review): presumably registered by the local `tasks` module -- confirm.
MIXTURE_OR_TASK_NAME = "pretrain_finnish"
# Cached tasks are turned off for this run.
USE_CACHED_TASKS = False
# Per-feature sequence lengths for the "inputs" and "targets" features.
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
# Number of training steps for this run.
TRAIN_STEPS = 500000
# Dropout is disabled (rate 0.0) for this run.
DROPOUT_RATE = 0.0
# Training batch size.
BATCH_SIZE = 256