Jeska committed on
Commit
d596030
1 Parent(s): eeba265

End of training

Browse files
all_results.json CHANGED
@@ -2,13 +2,13 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.6322020292282104,
4
  "eval_loss": 1.8354707956314087,
5
- "eval_runtime": 2.5103,
6
  "eval_samples": 1267,
7
- "eval_samples_per_second": 504.724,
8
- "eval_steps_per_second": 63.339,
9
  "train_loss": 2.186672953385506,
10
- "train_runtime": 425.0347,
11
  "train_samples": 11651,
12
- "train_samples_per_second": 82.236,
13
- "train_steps_per_second": 10.284
14
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.6322020292282104,
4
  "eval_loss": 1.8354707956314087,
5
+ "eval_runtime": 2.4427,
6
  "eval_samples": 1267,
7
+ "eval_samples_per_second": 518.682,
8
+ "eval_steps_per_second": 65.091,
9
  "train_loss": 2.186672953385506,
10
+ "train_runtime": 418.7818,
11
  "train_samples": 11651,
12
+ "train_samples_per_second": 83.464,
13
+ "train_steps_per_second": 10.437
14
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.6322020292282104,
4
  "eval_loss": 1.8354707956314087,
5
- "eval_runtime": 2.5103,
6
  "eval_samples": 1267,
7
- "eval_samples_per_second": 504.724,
8
- "eval_steps_per_second": 63.339
9
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.6322020292282104,
4
  "eval_loss": 1.8354707956314087,
5
+ "eval_runtime": 2.4427,
6
  "eval_samples": 1267,
7
+ "eval_samples_per_second": 518.682,
8
+ "eval_steps_per_second": 65.091
9
  }
runs/Dec02_08-22-15_jbuhmann/events.out.tfevents.1638433351.jbuhmann.9189.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9774331878ff5301a1e9fd93116dfb7092e48388c04ea7737a88365af7e03fe9
3
- size 18578
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81e74fdc5cbf34bdef782f4407b38337903cb8a0428b73e8260c1dc41258f19
3
+ size 18932
runs/Dec02_08-22-15_jbuhmann/events.out.tfevents.1638433774.jbuhmann.9189.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4fdd40baa8f0e13710423415631c18d17c3ba1a24d319042a5017fbfdee22da
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.186672953385506,
4
- "train_runtime": 425.0347,
5
  "train_samples": 11651,
6
- "train_samples_per_second": 82.236,
7
- "train_steps_per_second": 10.284
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.186672953385506,
4
+ "train_runtime": 418.7818,
5
  "train_samples": 11651,
6
+ "train_samples_per_second": 83.464,
7
+ "train_steps_per_second": 10.437
8
  }
trainer_state.json CHANGED
@@ -23,9 +23,9 @@
23
  "epoch": 1.0,
24
  "eval_accuracy": 0.5406472086906433,
25
  "eval_loss": 2.3865766525268555,
26
- "eval_runtime": 2.5099,
27
- "eval_samples_per_second": 504.808,
28
- "eval_steps_per_second": 63.35,
29
  "step": 1457
30
  },
31
  {
@@ -50,9 +50,9 @@
50
  "epoch": 2.0,
51
  "eval_accuracy": 0.6069455146789551,
52
  "eval_loss": 1.9364700317382812,
53
- "eval_runtime": 2.445,
54
- "eval_samples_per_second": 518.202,
55
- "eval_steps_per_second": 65.031,
56
  "step": 2914
57
  },
58
  {
@@ -77,9 +77,9 @@
77
  "epoch": 3.0,
78
  "eval_accuracy": 0.6322020292282104,
79
  "eval_loss": 1.8354707956314087,
80
- "eval_runtime": 2.4438,
81
- "eval_samples_per_second": 518.46,
82
- "eval_steps_per_second": 65.063,
83
  "step": 4371
84
  },
85
  {
@@ -87,9 +87,9 @@
87
  "step": 4371,
88
  "total_flos": 1151412634864512.0,
89
  "train_loss": 2.186672953385506,
90
- "train_runtime": 425.0347,
91
- "train_samples_per_second": 82.236,
92
- "train_steps_per_second": 10.284
93
  }
94
  ],
95
  "max_steps": 4371,
 
23
  "epoch": 1.0,
24
  "eval_accuracy": 0.5406472086906433,
25
  "eval_loss": 2.3865766525268555,
26
+ "eval_runtime": 2.3607,
27
+ "eval_samples_per_second": 536.704,
28
+ "eval_steps_per_second": 67.353,
29
  "step": 1457
30
  },
31
  {
 
50
  "epoch": 2.0,
51
  "eval_accuracy": 0.6069455146789551,
52
  "eval_loss": 1.9364700317382812,
53
+ "eval_runtime": 2.4048,
54
+ "eval_samples_per_second": 526.856,
55
+ "eval_steps_per_second": 66.117,
56
  "step": 2914
57
  },
58
  {
 
77
  "epoch": 3.0,
78
  "eval_accuracy": 0.6322020292282104,
79
  "eval_loss": 1.8354707956314087,
80
+ "eval_runtime": 2.3743,
81
+ "eval_samples_per_second": 533.633,
82
+ "eval_steps_per_second": 66.967,
83
  "step": 4371
84
  },
85
  {
 
87
  "step": 4371,
88
  "total_flos": 1151412634864512.0,
89
  "train_loss": 2.186672953385506,
90
+ "train_runtime": 418.7818,
91
+ "train_samples_per_second": 83.464,
92
+ "train_steps_per_second": 10.437
93
  }
94
  ],
95
  "max_steps": 4371,