gchhablani committed on
Commit
c4d56b6
1 Parent(s): 02f836b

End of training

Browse files
all_results.json CHANGED
@@ -2,13 +2,13 @@
2
  "epoch": 3.0,
3
  "eval_loss": 0.624345064163208,
4
  "eval_matthews_correlation": 0.0,
5
- "eval_runtime": 22.759,
6
  "eval_samples": 1043,
7
- "eval_samples_per_second": 45.828,
8
- "eval_steps_per_second": 5.756,
9
  "train_loss": 0.6174308222552717,
10
- "train_runtime": 2056.4994,
11
  "train_samples": 8551,
12
- "train_samples_per_second": 12.474,
13
- "train_steps_per_second": 3.119
14
  }
2
  "epoch": 3.0,
3
  "eval_loss": 0.624345064163208,
4
  "eval_matthews_correlation": 0.0,
5
+ "eval_runtime": 22.7153,
6
  "eval_samples": 1043,
7
+ "eval_samples_per_second": 45.916,
8
+ "eval_steps_per_second": 5.767,
9
  "train_loss": 0.6174308222552717,
10
+ "train_runtime": 2128.6729,
11
  "train_samples": 8551,
12
+ "train_samples_per_second": 12.051,
13
+ "train_steps_per_second": 3.013
14
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 3.0,
3
  "eval_loss": 0.624345064163208,
4
  "eval_matthews_correlation": 0.0,
5
- "eval_runtime": 22.759,
6
  "eval_samples": 1043,
7
- "eval_samples_per_second": 45.828,
8
- "eval_steps_per_second": 5.756
9
  }
2
  "epoch": 3.0,
3
  "eval_loss": 0.624345064163208,
4
  "eval_matthews_correlation": 0.0,
5
+ "eval_runtime": 22.7153,
6
  "eval_samples": 1043,
7
+ "eval_samples_per_second": 45.916,
8
+ "eval_steps_per_second": 5.767
9
  }
runs/Oct09_09-15-18_patrick-general-gpu/events.out.tfevents.1633771761.patrick-general-gpu.40257.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a1c55e3805cf532df97873439b80d8b95b3cf5ba6054ded52d241a7f8f3b445
3
- size 4730
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c79b3d2229e3d03a39848c4880589b318982bc94503b5d564187889ac0dd174
3
+ size 5084
runs/Oct09_09-15-18_patrick-general-gpu/events.out.tfevents.1633773921.patrick-general-gpu.40257.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49e4134e023573d5076badfdd6b2f63837cff1de4feb259b3e10f3ea9e7a0a9d
3
+ size 375
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 0.6174308222552717,
4
- "train_runtime": 2056.4994,
5
  "train_samples": 8551,
6
- "train_samples_per_second": 12.474,
7
- "train_steps_per_second": 3.119
8
  }
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 0.6174308222552717,
4
+ "train_runtime": 2128.6729,
5
  "train_samples": 8551,
6
+ "train_samples_per_second": 12.051,
7
+ "train_steps_per_second": 3.013
8
  }
trainer_state.json CHANGED
@@ -17,9 +17,9 @@
17
  "epoch": 1.0,
18
  "eval_loss": 0.6526795029640198,
19
  "eval_matthews_correlation": 0.0,
20
- "eval_runtime": 22.9563,
21
- "eval_samples_per_second": 45.434,
22
- "eval_steps_per_second": 5.706,
23
  "step": 2138
24
  },
25
  {
@@ -32,9 +32,9 @@
32
  "epoch": 2.0,
33
  "eval_loss": 0.6258916258811951,
34
  "eval_matthews_correlation": 0.0,
35
- "eval_runtime": 22.8508,
36
- "eval_samples_per_second": 45.644,
37
- "eval_steps_per_second": 5.733,
38
  "step": 4276
39
  },
40
  {
@@ -47,9 +47,9 @@
47
  "epoch": 3.0,
48
  "eval_loss": 0.624345064163208,
49
  "eval_matthews_correlation": 0.0,
50
- "eval_runtime": 22.8559,
51
- "eval_samples_per_second": 45.634,
52
- "eval_steps_per_second": 5.732,
53
  "step": 6414
54
  },
55
  {
@@ -57,9 +57,9 @@
57
  "step": 6414,
58
  "total_flos": 1.6048929796061184e+16,
59
  "train_loss": 0.6174308222552717,
60
- "train_runtime": 2056.4994,
61
- "train_samples_per_second": 12.474,
62
- "train_steps_per_second": 3.119
63
  }
64
  ],
65
  "max_steps": 6414,
17
  "epoch": 1.0,
18
  "eval_loss": 0.6526795029640198,
19
  "eval_matthews_correlation": 0.0,
20
+ "eval_runtime": 22.9461,
21
+ "eval_samples_per_second": 45.454,
22
+ "eval_steps_per_second": 5.709,
23
  "step": 2138
24
  },
25
  {
32
  "epoch": 2.0,
33
  "eval_loss": 0.6258916258811951,
34
  "eval_matthews_correlation": 0.0,
35
+ "eval_runtime": 22.6853,
36
+ "eval_samples_per_second": 45.977,
37
+ "eval_steps_per_second": 5.775,
38
  "step": 4276
39
  },
40
  {
47
  "epoch": 3.0,
48
  "eval_loss": 0.624345064163208,
49
  "eval_matthews_correlation": 0.0,
50
+ "eval_runtime": 22.6868,
51
+ "eval_samples_per_second": 45.974,
52
+ "eval_steps_per_second": 5.774,
53
  "step": 6414
54
  },
55
  {
57
  "step": 6414,
58
  "total_flos": 1.6048929796061184e+16,
59
  "train_loss": 0.6174308222552717,
60
+ "train_runtime": 2128.6729,
61
+ "train_samples_per_second": 12.051,
62
+ "train_steps_per_second": 3.013
63
  }
64
  ],
65
  "max_steps": 6414,