Sean Lee committed on
Commit
160dcbe
1 Parent(s): 96d6283

best checkpoint (epoch:8)

Browse files
Files changed (2) hide show
  1. checkpoint-best.pth +3 -0
  2. log.txt +10 -0
checkpoint-best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7141c4e471263ff5a3305b268bd6941bc76c5bf815852a17d4ee2fbab859861
3
+ size 8488275180
log.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.00020000000000000006, "train_min_lr": 1e-05, "train_loss": 334.56927541286404, "train_loss_scale": 221.92876292608196, "train_weight_decay": 0.009999999999999653, "train_grad_norm": NaN, "val_score": 59.041523986537705, "epoch": 0, "n_parameters": 707252188}
2
+ {"train_lr": 0.0003961660489081072, "train_min_lr": 1.9808302445405316e-05, "train_loss": 1.9752057734826933, "train_loss_scale": 947.0823439295289, "train_weight_decay": 0.009999999999999653, "train_grad_norm": 3.1552694289906187, "val_score": 62.28285535002408, "epoch": 1, "n_parameters": 707252188}
3
+ {"train_lr": 0.0003737128171630595, "train_min_lr": 1.8685640858152984e-05, "train_loss": 1.8990879598574575, "train_loss_scale": 8082.449125494702, "train_weight_decay": 0.010000000000000404, "train_grad_norm": Infinity, "val_score": 63.01712325022101, "epoch": 2, "n_parameters": 707252188}
4
+ {"train_lr": 0.0003315137691950233, "train_min_lr": 1.6575688459751186e-05, "train_loss": 1.8262149314001939, "train_loss_scale": 6119.161496233883, "train_weight_decay": 0.010000000000000404, "train_grad_norm": NaN, "val_score": 63.82619865452318, "epoch": 3, "n_parameters": 707252188}
5
+ {"train_lr": 0.00027465836730983267, "train_min_lr": 1.3732918365491597e-05, "train_loss": 1.7515122664015852, "train_loss_scale": 8362.470573215882, "train_weight_decay": 0.010000000000000404, "train_grad_norm": NaN, "val_score": 64.04780251925395, "epoch": 4, "n_parameters": 707252188}
6
+ {"train_lr": 0.0002100042120712058, "train_min_lr": 1.0500210603560317e-05, "train_loss": 1.6776694345524465, "train_loss_scale": 11152.74964892123, "train_weight_decay": 0.010000000000000404, "train_grad_norm": Infinity, "val_score": 64.31713756404511, "epoch": 5, "n_parameters": 707252188}
7
+ {"train_lr": 0.00014534954879462784, "train_min_lr": 7.2674774397314005e-06, "train_loss": 1.6121363192321119, "train_loss_scale": 10199.996936039832, "train_weight_decay": 0.010000000000000404, "train_grad_norm": NaN, "val_score": 64.47763272725284, "epoch": 6, "n_parameters": 707252188}
8
+ {"train_lr": 8.84926840724596e-05, "train_min_lr": 4.424634203622975e-06, "train_loss": 1.5584008516871, "train_loss_scale": 7565.546789225074, "train_weight_decay": 0.010000000000000404, "train_grad_norm": Infinity, "val_score": 64.52279537409952, "epoch": 7, "n_parameters": 707252188}
9
+ {"train_lr": 4.6291394908147905e-05, "train_min_lr": 2.3145697454074018e-06, "train_loss": 1.5199955951531363, "train_loss_scale": 8462.870420017873, "train_weight_decay": 0.010000000000000404, "train_grad_norm": NaN, "val_score": 64.51048802327892, "epoch": 8, "n_parameters": 707252188}
10
+ {"train_lr": 2.3835779599604868e-05, "train_min_lr": 1.191788979980233e-06, "train_loss": 1.4975423570448878, "train_loss_scale": 9759.701774543597, "train_weight_decay": 0.010000000000000404, "train_grad_norm": NaN, "val_score": 64.44887987250063, "epoch": 9, "n_parameters": 707252188}