Fitsum Gaim commited on
Commit
d1cf1d2
1 Parent(s): 0320faa
Files changed (4) hide show
  1. all_results.json +0 -17
  2. eval_results.json +0 -12
  3. train_results.json +0 -8
  4. trainer_state.json +0 -79
all_results.json DELETED
@@ -1,17 +0,0 @@
1
- {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.828,
4
- "eval_f1": 0.8476527900797165,
5
- "eval_loss": 0.679597795009613,
6
- "eval_precision": 0.760731319554849,
7
- "eval_recall": 0.957,
8
- "eval_runtime": 16.0366,
9
- "eval_samples": 4000,
10
- "eval_samples_per_second": 249.429,
11
- "eval_steps_per_second": 7.795,
12
- "train_loss": 0.23406425937416991,
13
- "train_runtime": 1839.4116,
14
- "train_samples": 49562,
15
- "train_samples_per_second": 80.833,
16
- "train_steps_per_second": 2.526
17
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
eval_results.json DELETED
@@ -1,12 +0,0 @@
1
- {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.828,
4
- "eval_f1": 0.8476527900797165,
5
- "eval_loss": 0.679597795009613,
6
- "eval_precision": 0.760731319554849,
7
- "eval_recall": 0.957,
8
- "eval_runtime": 16.0366,
9
- "eval_samples": 4000,
10
- "eval_samples_per_second": 249.429,
11
- "eval_steps_per_second": 7.795
12
- }
 
 
 
 
 
 
 
 
 
 
 
 
train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 3.0,
3
- "train_loss": 0.23406425937416991,
4
- "train_runtime": 1839.4116,
5
- "train_samples": 49562,
6
- "train_samples_per_second": 80.833,
7
- "train_steps_per_second": 2.526
8
- }
 
 
 
 
 
 
 
 
trainer_state.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
- "global_step": 4647,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.32,
12
- "learning_rate": 1.78480740262535e-05,
13
- "loss": 0.4305,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 0.65,
18
- "learning_rate": 1.5696148052506995e-05,
19
- "loss": 0.3478,
20
- "step": 1000
21
- },
22
- {
23
- "epoch": 0.97,
24
- "learning_rate": 1.3544222078760491e-05,
25
- "loss": 0.3352,
26
- "step": 1500
27
- },
28
- {
29
- "epoch": 1.29,
30
- "learning_rate": 1.139229610501399e-05,
31
- "loss": 0.2272,
32
- "step": 2000
33
- },
34
- {
35
- "epoch": 1.61,
36
- "learning_rate": 9.240370131267486e-06,
37
- "loss": 0.2143,
38
- "step": 2500
39
- },
40
- {
41
- "epoch": 1.94,
42
- "learning_rate": 7.088444157520982e-06,
43
- "loss": 0.202,
44
- "step": 3000
45
- },
46
- {
47
- "epoch": 2.26,
48
- "learning_rate": 4.936518183774478e-06,
49
- "loss": 0.147,
50
- "step": 3500
51
- },
52
- {
53
- "epoch": 2.58,
54
- "learning_rate": 2.7845922100279753e-06,
55
- "loss": 0.122,
56
- "step": 4000
57
- },
58
- {
59
- "epoch": 2.91,
60
- "learning_rate": 6.32666236281472e-07,
61
- "loss": 0.1166,
62
- "step": 4500
63
- },
64
- {
65
- "epoch": 3.0,
66
- "step": 4647,
67
- "total_flos": 9780232594314240.0,
68
- "train_loss": 0.23406425937416991,
69
- "train_runtime": 1839.4116,
70
- "train_samples_per_second": 80.833,
71
- "train_steps_per_second": 2.526
72
- }
73
- ],
74
- "max_steps": 4647,
75
- "num_train_epochs": 3,
76
- "total_flos": 9780232594314240.0,
77
- "trial_name": null,
78
- "trial_params": null
79
- }