TeetouchQQ committed on
Commit
acc825b
1 Parent(s): 62f4876

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +43 -107
trainer_state.json CHANGED
@@ -1,136 +1,72 @@
1
  {
2
- "best_metric": 0.9636638164520264,
3
- "best_model_checkpoint": "microsoft-swin-base-patch4-window7-224_bert-base-multilingual-cased_bert-base-multilingual-cased/checkpoint-4473",
4
- "epoch": 9.0,
5
- "global_step": 4473,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 1.0,
12
- "eval_loss": 1.1897900104522705,
13
- "eval_runtime": 529.9619,
14
- "eval_samples_per_second": 4.689,
15
- "eval_steps_per_second": 0.236,
16
- "step": 497
17
- },
18
- {
19
- "epoch": 1.01,
20
- "learning_rate": 1.8997987927565392e-05,
21
- "loss": 1.4457,
22
  "step": 500
23
  },
24
  {
25
- "epoch": 2.0,
26
- "eval_loss": 1.0949503183364868,
27
- "eval_runtime": 30.0349,
28
- "eval_samples_per_second": 82.737,
29
- "eval_steps_per_second": 4.162,
30
- "step": 994
31
  },
32
  {
33
- "epoch": 2.01,
34
- "learning_rate": 1.799195171026157e-05,
35
- "loss": 1.1664,
36
  "step": 1000
37
  },
38
  {
39
- "epoch": 3.0,
40
- "eval_loss": 1.0486524105072021,
41
- "eval_runtime": 29.951,
42
- "eval_samples_per_second": 82.969,
43
- "eval_steps_per_second": 4.173,
44
- "step": 1491
45
  },
46
  {
47
- "epoch": 3.02,
48
- "learning_rate": 1.6985915492957746e-05,
49
- "loss": 1.0482,
50
  "step": 1500
51
  },
52
  {
53
- "epoch": 4.0,
54
- "eval_loss": 1.0101640224456787,
55
- "eval_runtime": 29.925,
56
- "eval_samples_per_second": 83.041,
57
- "eval_steps_per_second": 4.177,
58
- "step": 1988
59
  },
60
  {
61
- "epoch": 4.02,
62
- "learning_rate": 1.5979879275653925e-05,
63
- "loss": 0.9577,
64
  "step": 2000
65
  },
66
  {
67
- "epoch": 5.0,
68
- "eval_loss": 0.9930654168128967,
69
- "eval_runtime": 29.9623,
70
- "eval_samples_per_second": 82.938,
71
- "eval_steps_per_second": 4.172,
72
- "step": 2485
73
- },
74
- {
75
- "epoch": 5.03,
76
- "learning_rate": 1.4973843058350102e-05,
77
- "loss": 0.8946,
78
- "step": 2500
79
- },
80
- {
81
- "epoch": 6.0,
82
- "eval_loss": 0.9802634119987488,
83
- "eval_runtime": 30.0215,
84
- "eval_samples_per_second": 82.774,
85
- "eval_steps_per_second": 4.164,
86
- "step": 2982
87
- },
88
- {
89
- "epoch": 6.04,
90
- "learning_rate": 1.396780684104628e-05,
91
- "loss": 0.8387,
92
- "step": 3000
93
- },
94
- {
95
- "epoch": 7.0,
96
- "eval_loss": 0.9800927639007568,
97
- "eval_runtime": 29.9858,
98
- "eval_samples_per_second": 82.873,
99
- "eval_steps_per_second": 4.169,
100
- "step": 3479
101
- },
102
- {
103
- "epoch": 7.04,
104
- "learning_rate": 1.2961770623742455e-05,
105
- "loss": 0.7909,
106
- "step": 3500
107
- },
108
- {
109
- "epoch": 8.0,
110
- "eval_loss": 0.9686193466186523,
111
- "eval_runtime": 30.1165,
112
- "eval_samples_per_second": 82.513,
113
- "eval_steps_per_second": 4.151,
114
- "step": 3976
115
- },
116
- {
117
- "epoch": 8.05,
118
- "learning_rate": 1.1955734406438632e-05,
119
- "loss": 0.7463,
120
- "step": 4000
121
- },
122
- {
123
- "epoch": 9.0,
124
- "eval_loss": 0.9636638164520264,
125
- "eval_runtime": 30.0385,
126
- "eval_samples_per_second": 82.727,
127
- "eval_steps_per_second": 4.161,
128
- "step": 4473
129
  }
130
  ],
131
- "max_steps": 9940,
132
- "num_train_epochs": 20,
133
- "total_flos": 1.6290726869086323e+19,
134
  "trial_name": null,
135
  "trial_params": null
136
  }
 
1
  {
2
+ "best_metric": 0.8071129322052002,
3
+ "best_model_checkpoint": "microsoft-swin-base-patch4-window7-224_bert-base-multilingual-cased_bert-base-multilingual-cased/checkpoint-2496",
4
+ "epoch": 4.0,
5
+ "global_step": 2496,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.8,
12
+ "learning_rate": 3.680128205128205e-05,
13
+ "loss": 1.2658,
 
 
 
 
 
 
 
 
14
  "step": 500
15
  },
16
  {
17
+ "epoch": 1.0,
18
+ "eval_loss": 0.9458033442497253,
19
+ "eval_runtime": 118.6535,
20
+ "eval_samples_per_second": 21.028,
21
+ "eval_steps_per_second": 1.315,
22
+ "step": 624
23
  },
24
  {
25
+ "epoch": 1.6,
26
+ "learning_rate": 3.359615384615385e-05,
27
+ "loss": 0.9614,
28
  "step": 1000
29
  },
30
  {
31
+ "epoch": 2.0,
32
+ "eval_loss": 0.8532279133796692,
33
+ "eval_runtime": 29.6586,
34
+ "eval_samples_per_second": 84.124,
35
+ "eval_steps_per_second": 5.26,
36
+ "step": 1248
37
  },
38
  {
39
+ "epoch": 2.4,
40
+ "learning_rate": 3.0391025641025643e-05,
41
+ "loss": 0.8407,
42
  "step": 1500
43
  },
44
  {
45
+ "epoch": 3.0,
46
+ "eval_loss": 0.8248330354690552,
47
+ "eval_runtime": 29.4482,
48
+ "eval_samples_per_second": 84.725,
49
+ "eval_steps_per_second": 5.297,
50
+ "step": 1872
51
  },
52
  {
53
+ "epoch": 3.21,
54
+ "learning_rate": 2.718589743589744e-05,
55
+ "loss": 0.7485,
56
  "step": 2000
57
  },
58
  {
59
+ "epoch": 4.0,
60
+ "eval_loss": 0.8071129322052002,
61
+ "eval_runtime": 29.4796,
62
+ "eval_samples_per_second": 84.635,
63
+ "eval_steps_per_second": 5.292,
64
+ "step": 2496
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  }
66
  ],
67
+ "max_steps": 6240,
68
+ "num_train_epochs": 10,
69
+ "total_flos": 7.268007926746055e+18,
70
  "trial_name": null,
71
  "trial_params": null
72
  }