raptorkwok committed on
Commit
1e8d67b
1 Parent(s): 2fbbc3b

End of training

Browse files
all_results.json CHANGED
@@ -2,14 +2,14 @@
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.796813717099257,
4
  "eval_loss": 1.4686633348464966,
5
- "eval_runtime": 1598.4891,
6
  "eval_samples": 71199,
7
- "eval_samples_per_second": 44.541,
8
- "eval_steps_per_second": 1.392,
9
  "perplexity": 4.3434255536068305,
10
  "train_loss": 1.455913220122233,
11
- "train_runtime": 35811.6134,
12
  "train_samples": 1353936,
13
- "train_samples_per_second": 37.807,
14
- "train_steps_per_second": 1.181
15
  }
 
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.796813717099257,
4
  "eval_loss": 1.4686633348464966,
5
+ "eval_runtime": 1595.6894,
6
  "eval_samples": 71199,
7
+ "eval_samples_per_second": 44.62,
8
+ "eval_steps_per_second": 1.394,
9
  "perplexity": 4.3434255536068305,
10
  "train_loss": 1.455913220122233,
11
+ "train_runtime": 36443.3148,
12
  "train_samples": 1353936,
13
+ "train_samples_per_second": 37.152,
14
+ "train_steps_per_second": 1.161
15
  }
eval_results.json CHANGED
@@ -2,9 +2,9 @@
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.796813717099257,
4
  "eval_loss": 1.4686633348464966,
5
- "eval_runtime": 1598.4891,
6
  "eval_samples": 71199,
7
- "eval_samples_per_second": 44.541,
8
- "eval_steps_per_second": 1.392,
9
  "perplexity": 4.3434255536068305
10
  }
 
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.796813717099257,
4
  "eval_loss": 1.4686633348464966,
5
+ "eval_runtime": 1595.6894,
6
  "eval_samples": 71199,
7
+ "eval_samples_per_second": 44.62,
8
+ "eval_steps_per_second": 1.394,
9
  "perplexity": 4.3434255536068305
10
  }
runs/Oct21_20-37-03_hkmustamd-Super-Server/events.out.tfevents.1729553061.hkmustamd-Super-Server.3374618.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dda7848145c90b1626014807c75dac9bdb3a7ebdc3099c9d837f3adab67fcc12
3
+ size 417
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 1.455913220122233,
4
- "train_runtime": 35811.6134,
5
  "train_samples": 1353936,
6
- "train_samples_per_second": 37.807,
7
- "train_steps_per_second": 1.181
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 1.455913220122233,
4
+ "train_runtime": 36443.3148,
5
  "train_samples": 1353936,
6
+ "train_samples_per_second": 37.152,
7
+ "train_steps_per_second": 1.161
8
  }
trainer_state.json CHANGED
@@ -516,9 +516,9 @@
516
  "step": 42311,
517
  "total_flos": 4.127720706618163e+17,
518
  "train_loss": 1.455913220122233,
519
- "train_runtime": 35811.6134,
520
- "train_samples_per_second": 37.807,
521
- "train_steps_per_second": 1.181
522
  }
523
  ],
524
  "max_steps": 42311,
 
516
  "step": 42311,
517
  "total_flos": 4.127720706618163e+17,
518
  "train_loss": 1.455913220122233,
519
+ "train_runtime": 36443.3148,
520
+ "train_samples_per_second": 37.152,
521
+ "train_steps_per_second": 1.161
522
  }
523
  ],
524
  "max_steps": 42311,