bwebs committed on
Commit
c6d4493
1 Parent(s): 330773d

Training in progress, step 13

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3afa61eeb036c0e6f83ebee42770c4ccabfb8c42fc5d11ffd4d42b8c40ccf3ba
3
  size 1044539653
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c7a59da2efa72379bcc54eca155c61485a34016dc472390837f7e6667e1f381
3
  size 1044539653
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98921f6735e9439448aa91c97aeb9156937de45eb28fd8fe2c6741b342b379f3
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
3
  size 5018531153
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:806511f3992549d6b23d7bb63c8a34a9a4101dfc09d578b75a4830edd1994881
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512f018b467c169e2aa0e142ea191b73786d79604dace238e3d4834d1df266e8
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff7f6d0ea2b6d04fce321db9d270a15a73873a32f3e79ddedac5fb877ae6bd45
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ecb4b4bc15e0509048b47d006eba35fc56dec209d6d90c42b552a5ead63d9d9
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3c0d70efc3a97da83ba1d6d51480c35c82f8635b66f83a6c9d16b65aacd4c51
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89ce2185c6877d072e8ca86c937358d8e8317963d32ce90379cdc35bd6460cdf
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.25,
5
- "global_step": 9,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -60,11 +60,35 @@
60
  "learning_rate": 0.0002,
61
  "loss": 1.1174,
62
  "step": 9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
  "max_steps": 500,
66
  "num_train_epochs": 125,
67
- "total_flos": 1502278457229312.0,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.25,
5
+ "global_step": 13,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
60
  "learning_rate": 0.0002,
61
  "loss": 1.1174,
62
  "step": 9
63
+ },
64
+ {
65
+ "epoch": 2.5,
66
+ "learning_rate": 0.0002,
67
+ "loss": 0.9802,
68
+ "step": 10
69
+ },
70
+ {
71
+ "epoch": 2.75,
72
+ "learning_rate": 0.0002,
73
+ "loss": 0.8965,
74
+ "step": 11
75
+ },
76
+ {
77
+ "epoch": 3.0,
78
+ "learning_rate": 0.0002,
79
+ "loss": 0.7951,
80
+ "step": 12
81
+ },
82
+ {
83
+ "epoch": 3.25,
84
+ "learning_rate": 0.0002,
85
+ "loss": 0.6422,
86
+ "step": 13
87
  }
88
  ],
89
  "max_steps": 500,
90
  "num_train_epochs": 125,
91
+ "total_flos": 2168782279802880.0,
92
  "trial_name": null,
93
  "trial_params": null
94
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98921f6735e9439448aa91c97aeb9156937de45eb28fd8fe2c6741b342b379f3
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
3
  size 5018531153
runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24418f91a6e09e6a9d11e75617cb8f6497ae5ed5400e4400a56468aec2554f92
3
- size 5906
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20ae9a3f24920171c22cccb9e05be58bfecabaa437ec9df242a7dd0a1a1bd2bf
3
+ size 6522