marcderbauer committed on
Commit
e6040b0
1 Parent(s): 96e99f1

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +22 -60
trainer_state.json CHANGED
@@ -1,84 +1,46 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.142857142857143,
5
- "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_loss": 2.3697612285614014,
13
- "eval_runtime": 53.7583,
14
- "eval_samples_per_second": 4.874,
15
- "eval_steps_per_second": 0.614,
16
- "step": 140
17
  },
18
  {
19
  "epoch": 2.0,
20
- "eval_loss": 2.350198745727539,
21
- "eval_runtime": 52.6608,
22
- "eval_samples_per_second": 4.975,
23
- "eval_steps_per_second": 0.627,
24
- "step": 280
25
  },
26
  {
27
  "epoch": 3.0,
28
- "eval_loss": 2.6000664234161377,
29
- "eval_runtime": 51.3966,
30
- "eval_samples_per_second": 5.098,
31
- "eval_steps_per_second": 0.642,
32
- "step": 420
33
  },
34
  {
35
- "epoch": 3.57,
36
- "learning_rate": 1.2857142857142859e-05,
37
- "loss": 1.8394,
38
  "step": 500
39
- },
40
- {
41
- "epoch": 4.0,
42
- "eval_loss": 3.011274576187134,
43
- "eval_runtime": 51.1881,
44
- "eval_samples_per_second": 5.118,
45
- "eval_steps_per_second": 0.645,
46
- "step": 560
47
- },
48
- {
49
- "epoch": 5.0,
50
- "eval_loss": 3.5172500610351562,
51
- "eval_runtime": 53.2278,
52
- "eval_samples_per_second": 4.922,
53
- "eval_steps_per_second": 0.62,
54
- "step": 700
55
- },
56
- {
57
- "epoch": 6.0,
58
- "eval_loss": 3.840390682220459,
59
- "eval_runtime": 53.3892,
60
- "eval_samples_per_second": 4.907,
61
- "eval_steps_per_second": 0.618,
62
- "step": 840
63
- },
64
- {
65
- "epoch": 7.0,
66
- "eval_loss": 4.020865440368652,
67
- "eval_runtime": 52.1972,
68
- "eval_samples_per_second": 5.019,
69
- "eval_steps_per_second": 0.632,
70
- "step": 980
71
- },
72
- {
73
- "epoch": 7.14,
74
- "learning_rate": 5.7142857142857145e-06,
75
- "loss": 0.4408,
76
- "step": 1000
77
  }
78
  ],
79
- "max_steps": 1400,
80
  "num_train_epochs": 10,
81
- "total_flos": 1857413971968000.0,
82
  "trial_name": null,
83
  "trial_params": null
84
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.048780487804878,
5
+ "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_loss": 1.8646807670593262,
13
+ "eval_runtime": 68.8052,
14
+ "eval_samples_per_second": 4.709,
15
+ "eval_steps_per_second": 0.596,
16
+ "step": 164
17
  },
18
  {
19
  "epoch": 2.0,
20
+ "eval_loss": 1.8987102508544922,
21
+ "eval_runtime": 70.9224,
22
+ "eval_samples_per_second": 4.568,
23
+ "eval_steps_per_second": 0.578,
24
+ "step": 328
25
  },
26
  {
27
  "epoch": 3.0,
28
+ "eval_loss": 2.09053373336792,
29
+ "eval_runtime": 65.7815,
30
+ "eval_samples_per_second": 4.925,
31
+ "eval_steps_per_second": 0.623,
32
+ "step": 492
33
  },
34
  {
35
+ "epoch": 3.05,
36
+ "learning_rate": 1.3902439024390244e-05,
37
+ "loss": 1.6067,
38
  "step": 500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
+ "max_steps": 1640,
42
  "num_train_epochs": 10,
43
+ "total_flos": 925920865026048.0,
44
  "trial_name": null,
45
  "trial_params": null
46
  }