bwebs commited on
Commit
330773d
1 Parent(s): 8cccd7e

Training in progress, step 9

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c32be757f0288a7c67461a859c5f4d72e961a7d5c562d0fa1664c73de6c8154
3
  size 1044539653
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3afa61eeb036c0e6f83ebee42770c4ccabfb8c42fc5d11ffd4d42b8c40ccf3ba
3
  size 1044539653
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:816a60f80d1cb9952d19b233fc387797608aafd271895e74c640a0a12d4a308e
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98921f6735e9439448aa91c97aeb9156937de45eb28fd8fe2c6741b342b379f3
3
  size 5018531153
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ad35f6fad5899e2120c58dd6f8e19da6576502e2471f7fbb0d8f573b5b8c4cd
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:806511f3992549d6b23d7bb63c8a34a9a4101dfc09d578b75a4830edd1994881
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4226304fb62e961f1febc70be2db3d4aa0fa092f6ffb6147df348b679da41079
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff7f6d0ea2b6d04fce321db9d270a15a73873a32f3e79ddedac5fb877ae6bd45
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfad7054a4f055c4b3d58bee7c17c677cfc1a348a8f81a9063089f8cb55dc31e
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3c0d70efc3a97da83ba1d6d51480c35c82f8635b66f83a6c9d16b65aacd4c51
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.25,
5
- "global_step": 5,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -36,11 +36,35 @@
36
  "learning_rate": 0.0002,
37
  "loss": 1.5316,
38
  "step": 5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "max_steps": 500,
42
  "num_train_epochs": 125,
43
- "total_flos": 835774634655744.0,
44
  "trial_name": null,
45
  "trial_params": null
46
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.25,
5
+ "global_step": 9,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
36
  "learning_rate": 0.0002,
37
  "loss": 1.5316,
38
  "step": 5
39
+ },
40
+ {
41
+ "epoch": 1.5,
42
+ "learning_rate": 0.0002,
43
+ "loss": 1.4856,
44
+ "step": 6
45
+ },
46
+ {
47
+ "epoch": 1.75,
48
+ "learning_rate": 0.0002,
49
+ "loss": 1.3389,
50
+ "step": 7
51
+ },
52
+ {
53
+ "epoch": 2.0,
54
+ "learning_rate": 0.0002,
55
+ "loss": 1.2343,
56
+ "step": 8
57
+ },
58
+ {
59
+ "epoch": 2.25,
60
+ "learning_rate": 0.0002,
61
+ "loss": 1.1174,
62
+ "step": 9
63
  }
64
  ],
65
  "max_steps": 500,
66
  "num_train_epochs": 125,
67
+ "total_flos": 1502278457229312.0,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:816a60f80d1cb9952d19b233fc387797608aafd271895e74c640a0a12d4a308e
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98921f6735e9439448aa91c97aeb9156937de45eb28fd8fe2c6741b342b379f3
3
  size 5018531153
runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a1ff8931a8754e3d54dd36950dce6cd0ee70d0b9b8e7bd51c1948bdf67c08b2
3
- size 5290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24418f91a6e09e6a9d11e75617cb8f6497ae5ed5400e4400a56468aec2554f92
3
+ size 5906