g8a9 committed on
Commit
fb5a889
1 Parent(s): cf8be5e

End of training

Browse files
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 31.18,
3
- "eval_accuracy": 0.1376987935196624,
4
- "eval_loss": 6.486697196960449,
5
- "eval_runtime": 169.2274,
6
  "eval_samples": 24055,
7
- "eval_samples_per_second": 142.146,
8
- "eval_steps_per_second": 2.222,
9
- "perplexity": 656.351978052217,
10
- "train_loss": 6.89371246590102,
11
- "train_runtime": 29548.4223,
12
  "train_samples": 24910,
13
- "train_samples_per_second": 33.721,
14
- "train_steps_per_second": 0.263
15
  }
 
1
  {
2
+ "epoch": 89.58,
3
+ "eval_accuracy": 0.5148013040185571,
4
+ "eval_loss": 2.73911714553833,
5
+ "eval_runtime": 145.896,
6
  "eval_samples": 24055,
7
+ "eval_samples_per_second": 164.878,
8
+ "eval_steps_per_second": 5.154,
9
+ "perplexity": 15.47331837619993,
10
+ "train_loss": 3.7431876293448516,
11
+ "train_runtime": 42244.2763,
12
  "train_samples": 24910,
13
+ "train_samples_per_second": 58.967,
14
+ "train_steps_per_second": 0.114
15
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 31.18,
3
- "eval_accuracy": 0.1376987935196624,
4
- "eval_loss": 6.486697196960449,
5
- "eval_runtime": 169.2274,
6
  "eval_samples": 24055,
7
- "eval_samples_per_second": 142.146,
8
- "eval_steps_per_second": 2.222,
9
- "perplexity": 656.351978052217
10
  }
 
1
  {
2
+ "epoch": 89.58,
3
+ "eval_accuracy": 0.5148013040185571,
4
+ "eval_loss": 2.73911714553833,
5
+ "eval_runtime": 145.896,
6
  "eval_samples": 24055,
7
+ "eval_samples_per_second": 164.878,
8
+ "eval_steps_per_second": 5.154,
9
+ "perplexity": 15.47331837619993
10
  }
runs/Feb14_00-12-10_monica.sm.unibocconi.it/events.out.tfevents.1676372443.monica.sm.unibocconi.it.4164817.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26625321fb87508e6806a980245d911e5f14945900233a180200a73b51d5fcc8
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 31.18,
3
- "train_loss": 6.89371246590102,
4
- "train_runtime": 29548.4223,
5
  "train_samples": 24910,
6
- "train_samples_per_second": 33.721,
7
- "train_steps_per_second": 0.263
8
  }
 
1
  {
2
+ "epoch": 89.58,
3
+ "train_loss": 3.7431876293448516,
4
+ "train_runtime": 42244.2763,
5
  "train_samples": 24910,
6
+ "train_samples_per_second": 58.967,
7
+ "train_steps_per_second": 0.114
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff