mt5-small-trimmed-it-itquad-qg / trainer_config.json
asahi417's picture
model update
b9be7ac
raw
history blame
367 Bytes
{"dataset_path": "lmqg/qg_itquad", "dataset_name": "default", "input_types": "paragraph_answer", "output_types": "question", "prefix_types": null, "model": "vocabtrimmer/mt5-small-trimmed-it", "max_length": 512, "max_length_output": 32, "epoch": 14, "batch": 32, "lr": 0.001, "fp16": false, "random_seed": 1, "gradient_accumulation_steps": 2, "label_smoothing": 0.15}