masatochi committed on
Commit
7c67960
1 Parent(s): 70d5ab3

Training in progress, step 145, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab2e0910ee8ff17a681acdd56f9074e96fa82a916a8f3239bf3f1f3cd80ce465
3
  size 59827904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6232ed48b9c18e085faf4119484b73bc66018b47f3bd50b5a6e541e5ccc1e03
3
  size 59827904
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13e25365edc54422e82cbac4c671e2435e8bbd2900af3e9044725a0b51ab79a1
3
  size 30875540
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b26583c118f37f0f901f941c1caddee16c708cd7a19dc546b58c02f36d2f5862
3
  size 30875540
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3620fd05065514f79fda6c0faf379ce93ec4350e71e2f2104721a44e9230ff6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b362eff1a75d9bf020525cb57285e4b861253ed25664be12ca93f1935aca2a48
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:671828e69cd8fd42106344a5797cbc78f701a434a6386d9dfacd16451ba179aa
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be04ea4bc9f159499b4a7b296b15e0c0e5c54743663ee8550a26340683f89e32
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.06846384253316218,
5
  "eval_steps": 34,
6
- "global_step": 140,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1027,6 +1027,41 @@
1027
  "learning_rate": 5.542616442234618e-05,
1028
  "loss": 10.4222,
1029
  "step": 140
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1030
  }
1031
  ],
1032
  "logging_steps": 1,
@@ -1046,7 +1081,7 @@
1046
  "attributes": {}
1047
  }
1048
  },
1049
- "total_flos": 3.086271546340147e+17,
1050
  "train_batch_size": 3,
1051
  "trial_name": null,
1052
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.0709089797664894,
5
  "eval_steps": 34,
6
+ "global_step": 145,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1027
  "learning_rate": 5.542616442234618e-05,
1028
  "loss": 10.4222,
1029
  "step": 140
1030
+ },
1031
+ {
1032
+ "epoch": 0.06895286997982762,
1033
+ "grad_norm": Infinity,
1034
+ "learning_rate": 5.37796116459687e-05,
1035
+ "loss": 9.8649,
1036
+ "step": 141
1037
+ },
1038
+ {
1039
+ "epoch": 0.06944189742649307,
1040
+ "grad_norm": Infinity,
1041
+ "learning_rate": 5.214884308987136e-05,
1042
+ "loss": 10.3785,
1043
+ "step": 142
1044
+ },
1045
+ {
1046
+ "epoch": 0.06993092487315851,
1047
+ "grad_norm": Infinity,
1048
+ "learning_rate": 5.0534415660022136e-05,
1049
+ "loss": 9.2483,
1050
+ "step": 143
1051
+ },
1052
+ {
1053
+ "epoch": 0.07041995231982395,
1054
+ "grad_norm": Infinity,
1055
+ "learning_rate": 4.893688068190932e-05,
1056
+ "loss": 10.5841,
1057
+ "step": 144
1058
+ },
1059
+ {
1060
+ "epoch": 0.0709089797664894,
1061
+ "grad_norm": Infinity,
1062
+ "learning_rate": 4.735678371226441e-05,
1063
+ "loss": 8.9077,
1064
+ "step": 145
1065
  }
1066
  ],
1067
  "logging_steps": 1,
 
1081
  "attributes": {}
1082
  }
1083
  },
1084
+ "total_flos": 3.1964955301380096e+17,
1085
  "train_batch_size": 3,
1086
  "trial_name": null,
1087
  "trial_params": null