cybershiptrooper's picture
add ioi edges and rename model names
0355bdd
raw
history blame
372 Bytes
{"next_token": true, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 256, "lr": 0.001, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "clip_grad_norm": 1.0, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4}