mmanikanta committed on
Commit
00e2b2f
1 Parent(s): f036c7b

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.9901,
4
- "eval_loss": 0.03231855481863022,
5
- "eval_runtime": 133.8531,
6
- "eval_samples_per_second": 74.709,
7
- "eval_steps_per_second": 4.669,
8
- "total_flos": 2.091911758043834e+19,
9
- "train_loss": 0.13970869080807824,
10
- "train_runtime": 10165.3024,
11
- "train_samples_per_second": 26.561,
12
- "train_steps_per_second": 0.415
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.9931,
4
+ "eval_loss": 0.02777969278395176,
5
+ "eval_runtime": 46.8321,
6
+ "eval_samples_per_second": 213.529,
7
+ "eval_steps_per_second": 13.346,
8
+ "total_flos": 6.9730391934794465e+19,
9
+ "train_loss": 0.0988586475932242,
10
+ "train_runtime": 11106.5671,
11
+ "train_samples_per_second": 81.033,
12
+ "train_steps_per_second": 1.266
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.9901,
4
- "eval_loss": 0.03231855481863022,
5
- "eval_runtime": 133.8531,
6
- "eval_samples_per_second": 74.709,
7
- "eval_steps_per_second": 4.669
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.9931,
4
+ "eval_loss": 0.02777969278395176,
5
+ "eval_runtime": 46.8321,
6
+ "eval_samples_per_second": 213.529,
7
+ "eval_steps_per_second": 13.346
8
  }
runs/Apr16_03-59-49_8252f766fecd/events.out.tfevents.1713251252.8252f766fecd.697.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d778641bf3daf9c895fda78c6be7594e36ddf1886466b01c5673a671e1f045b4
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 2.091911758043834e+19,
4
- "train_loss": 0.13970869080807824,
5
- "train_runtime": 10165.3024,
6
- "train_samples_per_second": 26.561,
7
- "train_steps_per_second": 0.415
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 6.9730391934794465e+19,
4
+ "train_loss": 0.0988586475932242,
5
+ "train_runtime": 11106.5671,
6
+ "train_samples_per_second": 81.033,
7
+ "train_steps_per_second": 1.266
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff