mmanikanta committed on
Commit
545a75f
1 Parent(s): 5b4602c

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.9874,
4
- "eval_loss": 0.034222181886434555,
5
- "eval_runtime": 60.0131,
6
- "eval_samples_per_second": 166.63,
7
- "eval_steps_per_second": 5.216,
8
- "total_flos": 2.23628338666187e+19,
9
- "train_loss": 0.1441501469903786,
10
- "train_runtime": 13283.8875,
11
- "train_samples_per_second": 67.751,
12
- "train_steps_per_second": 0.529
13
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.9833333333333333,
4
+ "eval_loss": 0.04612118750810623,
5
+ "eval_runtime": 108.8524,
6
+ "eval_samples_per_second": 275.602,
7
+ "eval_steps_per_second": 8.617,
8
+ "total_flos": 1.73991922900992e+19,
9
+ "train_loss": 0.15263754843139998,
10
+ "train_runtime": 7208.4995,
11
+ "train_samples_per_second": 97.108,
12
+ "train_steps_per_second": 0.759
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.9874,
4
- "eval_loss": 0.034222181886434555,
5
- "eval_runtime": 60.0131,
6
- "eval_samples_per_second": 166.63,
7
- "eval_steps_per_second": 5.216
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.9833333333333333,
4
+ "eval_loss": 0.04612118750810623,
5
+ "eval_runtime": 108.8524,
6
+ "eval_samples_per_second": 275.602,
7
+ "eval_steps_per_second": 8.617
8
  }
runs/Apr20_16-04-35_d1e86387316e/events.out.tfevents.1713637357.d1e86387316e.395.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c34655e59c12c79c92ffe6760960cac4bea3b1f78b7e0abec145b3715554687
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "total_flos": 2.23628338666187e+19,
4
- "train_loss": 0.1441501469903786,
5
- "train_runtime": 13283.8875,
6
- "train_samples_per_second": 67.751,
7
- "train_steps_per_second": 0.529
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "total_flos": 1.73991922900992e+19,
4
+ "train_loss": 0.15263754843139998,
5
+ "train_runtime": 7208.4995,
6
+ "train_samples_per_second": 97.108,
7
+ "train_steps_per_second": 0.759
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff