zkdeng commited on
Commit
18dcbbc
·
verified ·
1 Parent(s): f623d87

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -5,11 +5,11 @@
5
  "eval_loss": 0.4917445778846741,
6
  "eval_precision": 0.9019841269841271,
7
  "eval_recall": 0.888888888888889,
8
- "eval_runtime": 2.8796,
9
- "eval_samples_per_second": 17.363,
10
- "eval_steps_per_second": 1.389,
11
- "train_loss": 0.8048010190327962,
12
- "train_runtime": 101.246,
13
- "train_samples_per_second": 19.606,
14
  "train_steps_per_second": 0.296
15
  }
 
5
  "eval_loss": 0.4917445778846741,
6
  "eval_precision": 0.9019841269841271,
7
  "eval_recall": 0.888888888888889,
8
+ "eval_runtime": 2.7009,
9
+ "eval_samples_per_second": 18.512,
10
+ "eval_steps_per_second": 1.481,
11
+ "train_loss": 0.8048010031382243,
12
+ "train_runtime": 101.5046,
13
+ "train_samples_per_second": 19.556,
14
  "train_steps_per_second": 0.296
15
  }
eval_results.json CHANGED
@@ -4,7 +4,7 @@
4
  "eval_loss": 0.4917445778846741,
5
  "eval_precision": 0.9019841269841271,
6
  "eval_recall": 0.888888888888889,
7
- "eval_runtime": 2.8796,
8
- "eval_samples_per_second": 17.363,
9
- "eval_steps_per_second": 1.389
10
  }
 
4
  "eval_loss": 0.4917445778846741,
5
  "eval_precision": 0.9019841269841271,
6
  "eval_recall": 0.888888888888889,
7
+ "eval_runtime": 2.7009,
8
+ "eval_samples_per_second": 18.512,
9
+ "eval_steps_per_second": 1.481
10
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1a39cfc8adad56bf2ee22ca8629aa0029137a9500168ee7d233da5e00e31526
3
  size 111550573
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45472aab20ab139959ef06b6fd6e930443066f347b6c459a418f7ecb7be4843a
3
  size 111550573
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 4.8,
3
- "train_loss": 0.8048010190327962,
4
- "train_runtime": 101.246,
5
- "train_samples_per_second": 19.606,
6
  "train_steps_per_second": 0.296
7
  }
 
1
  {
2
  "epoch": 4.8,
3
+ "train_loss": 0.8048010031382243,
4
+ "train_runtime": 101.5046,
5
+ "train_samples_per_second": 19.556,
6
  "train_steps_per_second": 0.296
7
  }
trainer_state.json CHANGED
@@ -15,9 +15,9 @@
15
  "eval_loss": 1.1803159713745117,
16
  "eval_precision": 0.6789160839160839,
17
  "eval_recall": 0.6868831168831169,
18
- "eval_runtime": 3.3618,
19
- "eval_samples_per_second": 14.873,
20
- "eval_steps_per_second": 1.19,
21
  "step": 6
22
  },
23
  {
@@ -30,24 +30,24 @@
30
  "epoch": 1.92,
31
  "eval_accuracy": 0.84,
32
  "eval_f1": 0.8387969924812031,
33
- "eval_loss": 0.7862006425857544,
34
  "eval_precision": 0.8603030303030303,
35
  "eval_recall": 0.856969696969697,
36
- "eval_runtime": 2.7831,
37
- "eval_samples_per_second": 17.966,
38
- "eval_steps_per_second": 1.437,
39
  "step": 12
40
  },
41
  {
42
  "epoch": 2.88,
43
  "eval_accuracy": 0.9,
44
  "eval_f1": 0.9023978919631095,
45
- "eval_loss": 0.5749024748802185,
46
  "eval_precision": 0.9034848484848486,
47
  "eval_recall": 0.9103030303030304,
48
- "eval_runtime": 2.6475,
49
- "eval_samples_per_second": 18.886,
50
- "eval_steps_per_second": 1.511,
51
  "step": 18
52
  },
53
  {
@@ -60,12 +60,12 @@
60
  "epoch": 4.0,
61
  "eval_accuracy": 0.9,
62
  "eval_f1": 0.9023978919631095,
63
- "eval_loss": 0.47980964183807373,
64
  "eval_precision": 0.9034848484848486,
65
  "eval_recall": 0.9103030303030304,
66
- "eval_runtime": 2.685,
67
- "eval_samples_per_second": 18.622,
68
- "eval_steps_per_second": 1.49,
69
  "step": 25
70
  },
71
  {
@@ -78,21 +78,21 @@
78
  "epoch": 4.8,
79
  "eval_accuracy": 0.9,
80
  "eval_f1": 0.9023978919631095,
81
- "eval_loss": 0.46124908328056335,
82
  "eval_precision": 0.9034848484848486,
83
  "eval_recall": 0.9103030303030304,
84
- "eval_runtime": 2.7597,
85
- "eval_samples_per_second": 18.118,
86
- "eval_steps_per_second": 1.449,
87
  "step": 30
88
  },
89
  {
90
  "epoch": 4.8,
91
  "step": 30,
92
  "total_flos": 1.4114178534172262e+17,
93
- "train_loss": 0.8048010190327962,
94
- "train_runtime": 101.246,
95
- "train_samples_per_second": 19.606,
96
  "train_steps_per_second": 0.296
97
  }
98
  ],
 
15
  "eval_loss": 1.1803159713745117,
16
  "eval_precision": 0.6789160839160839,
17
  "eval_recall": 0.6868831168831169,
18
+ "eval_runtime": 3.4169,
19
+ "eval_samples_per_second": 14.633,
20
+ "eval_steps_per_second": 1.171,
21
  "step": 6
22
  },
23
  {
 
30
  "epoch": 1.92,
31
  "eval_accuracy": 0.84,
32
  "eval_f1": 0.8387969924812031,
33
+ "eval_loss": 0.7862005829811096,
34
  "eval_precision": 0.8603030303030303,
35
  "eval_recall": 0.856969696969697,
36
+ "eval_runtime": 2.6641,
37
+ "eval_samples_per_second": 18.768,
38
+ "eval_steps_per_second": 1.501,
39
  "step": 12
40
  },
41
  {
42
  "epoch": 2.88,
43
  "eval_accuracy": 0.9,
44
  "eval_f1": 0.9023978919631095,
45
+ "eval_loss": 0.5749024152755737,
46
  "eval_precision": 0.9034848484848486,
47
  "eval_recall": 0.9103030303030304,
48
+ "eval_runtime": 2.6511,
49
+ "eval_samples_per_second": 18.86,
50
+ "eval_steps_per_second": 1.509,
51
  "step": 18
52
  },
53
  {
 
60
  "epoch": 4.0,
61
  "eval_accuracy": 0.9,
62
  "eval_f1": 0.9023978919631095,
63
+ "eval_loss": 0.47980961203575134,
64
  "eval_precision": 0.9034848484848486,
65
  "eval_recall": 0.9103030303030304,
66
+ "eval_runtime": 2.6994,
67
+ "eval_samples_per_second": 18.523,
68
+ "eval_steps_per_second": 1.482,
69
  "step": 25
70
  },
71
  {
 
78
  "epoch": 4.8,
79
  "eval_accuracy": 0.9,
80
  "eval_f1": 0.9023978919631095,
81
+ "eval_loss": 0.4612491726875305,
82
  "eval_precision": 0.9034848484848486,
83
  "eval_recall": 0.9103030303030304,
84
+ "eval_runtime": 2.6906,
85
+ "eval_samples_per_second": 18.583,
86
+ "eval_steps_per_second": 1.487,
87
  "step": 30
88
  },
89
  {
90
  "epoch": 4.8,
91
  "step": 30,
92
  "total_flos": 1.4114178534172262e+17,
93
+ "train_loss": 0.8048010031382243,
94
+ "train_runtime": 101.5046,
95
+ "train_samples_per_second": 19.556,
96
  "train_steps_per_second": 0.296
97
  }
98
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ab3212533198c3de7e5dda4341f6ae79dafe0f3ee0a05e1d3c333c0f4df3a6a
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c51a483b7010c9031af33c45a848c04fac70447e17aacfc4ec922618a70f1b6
3
  size 4155