bwebs committed on
Commit
1d42776
1 Parent(s): c6d4493

Training in progress, step 17

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c7a59da2efa72379bcc54eca155c61485a34016dc472390837f7e6667e1f381
3
  size 1044539653
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab7fcf96f319e26d9237e7aff6ad22c9c56adf34ea983de61ca6e41477e69855
3
  size 1044539653
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af06f840a430ad15f2b92f42be6568a6abc831744cb2250fd9b9ac18ef863ec
3
  size 5018531153
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:512f018b467c169e2aa0e142ea191b73786d79604dace238e3d4834d1df266e8
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3236c10f0630265339ef1aa6795f2331531941c060942cafc2e403641dc426
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ecb4b4bc15e0509048b47d006eba35fc56dec209d6d90c42b552a5ead63d9d9
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16ad615861470fd875e71876be305dededf7011ade3ed6da4cc2aabc41bda690
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89ce2185c6877d072e8ca86c937358d8e8317963d32ce90379cdc35bd6460cdf
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e76b66bdd086927b026285b23e5d38dff5415e1889470b91fef3e2e48c4f1583
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.25,
5
- "global_step": 13,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -84,11 +84,35 @@
84
  "learning_rate": 0.0002,
85
  "loss": 0.6422,
86
  "step": 13
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  }
88
  ],
89
  "max_steps": 500,
90
  "num_train_epochs": 125,
91
- "total_flos": 2168782279802880.0,
92
  "trial_name": null,
93
  "trial_params": null
94
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.25,
5
+ "global_step": 17,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
84
  "learning_rate": 0.0002,
85
  "loss": 0.6422,
86
  "step": 13
87
+ },
88
+ {
89
+ "epoch": 3.5,
90
+ "learning_rate": 0.0002,
91
+ "loss": 0.6023,
92
+ "step": 14
93
+ },
94
+ {
95
+ "epoch": 3.75,
96
+ "learning_rate": 0.0002,
97
+ "loss": 0.5078,
98
+ "step": 15
99
+ },
100
+ {
101
+ "epoch": 4.0,
102
+ "learning_rate": 0.0002,
103
+ "loss": 0.5033,
104
+ "step": 16
105
+ },
106
+ {
107
+ "epoch": 4.25,
108
+ "learning_rate": 0.0002,
109
+ "loss": 0.4317,
110
+ "step": 17
111
  }
112
  ],
113
  "max_steps": 500,
114
  "num_train_epochs": 125,
115
+ "total_flos": 2835286102376448.0,
116
  "trial_name": null,
117
  "trial_params": null
118
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
3
  size 5018531153
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af06f840a430ad15f2b92f42be6568a6abc831744cb2250fd9b9ac18ef863ec
3
  size 5018531153
runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20ae9a3f24920171c22cccb9e05be58bfecabaa437ec9df242a7dd0a1a1bd2bf
3
- size 6522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80957985bf14a4ea6ae6bdf815ad3c111edbe74af26a336a0bd78adfd0239245
3
+ size 7138