Theoreticallyhugo commited on
Commit
8100d0f
1 Parent(s): 6acf2d0

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ef9cbea4284aab780e4dfcae38caec260a206288c47dbe643fa2388ac84a0e9
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cde84e40589a581099de6ffd2b1dfb10787b5c8d90d303ed810a70a33697cd5
3
  size 592330980
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b929b09b8681501786d959eed9fa2f0053e4905bde89144f635820c2db40adf5
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f651f65956ed08780348bf8bfcaac2b4e5a12648ffed35bb061a6ba26807bf7
3
  size 1014670074
checkpoint-41/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b75d0f85c6e5f43bda08f24453a869f5d0b5d0d33d936ef1b542f406f081347
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a939982f711c8a91f0893b4f281f0db4fd89d7ca52de2aed82098ef9ff76ea2
3
  size 14244
checkpoint-41/trainer_state.json CHANGED
@@ -14,60 +14,60 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 339.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 160.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.7931404072883173,
27
- "precision": 0.8,
28
- "recall": 0.7863974495217854,
29
- "support": 941.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.40067911714770804,
33
- "precision": 0.46561443066516345,
34
- "recall": 0.35163899531715626,
35
- "support": 4698.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.5607655502392344,
39
- "precision": 0.4144271570014144,
40
- "recall": 0.8668639053254438,
41
- "support": 2028.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8556539864512767,
45
- "precision": 0.8844441252513645,
46
- "recall": 0.8286790929277976,
47
- "support": 14861.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.9839078762825717,
51
- "precision": 0.9700167382286587,
52
- "recall": 0.9982026510896428,
53
- "support": 13353.0
54
  },
55
- "eval_accuracy": 0.8189664650907091,
56
- "eval_loss": 0.4724249243736267,
57
  "eval_macro avg": {
58
- "f1-score": 0.5134495624870155,
59
- "precision": 0.5049289215923716,
60
- "recall": 0.5473974420259752,
61
- "support": 36380.0
62
  },
63
- "eval_runtime": 1.4721,
64
- "eval_samples_per_second": 55.025,
65
- "eval_steps_per_second": 7.473,
66
  "eval_weighted avg": {
67
- "f1-score": 0.8141826255128369,
68
- "precision": 0.8212499318469384,
69
- "recall": 0.8189664650907091,
70
- "support": 36380.0
71
  },
72
  "step": 41
73
  }
@@ -77,7 +77,7 @@
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
- "total_flos": 143344257399000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 271.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 139.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.778263585259213,
27
+ "precision": 0.643595041322314,
28
+ "recall": 0.9842022116903634,
29
+ "support": 633.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.5213290460878884,
33
+ "precision": 0.4563708012760368,
34
+ "recall": 0.6078480379905024,
35
+ "support": 4001.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.520462355513902,
39
+ "precision": 0.7011784511784511,
40
+ "recall": 0.4138102334823646,
41
+ "support": 2013.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8648793805666204,
45
+ "precision": 0.8778050331607159,
46
+ "recall": 0.8523288637967537,
47
+ "support": 11336.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.9947169811320755,
51
+ "precision": 0.9991081780076697,
52
+ "recall": 0.9903642149929278,
53
+ "support": 11312.0
54
  },
55
+ "eval_accuracy": 0.8332940582393537,
56
+ "eval_loss": 0.4083092212677002,
57
  "eval_macro avg": {
58
+ "f1-score": 0.5256644783656713,
59
+ "precision": 0.5254367864207411,
60
+ "recall": 0.5497933659932731,
61
+ "support": 29705.0
62
  },
63
+ "eval_runtime": 1.4074,
64
+ "eval_samples_per_second": 56.843,
65
+ "eval_steps_per_second": 7.105,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.830926787853407,
68
+ "precision": 0.8381591322948091,
69
+ "recall": 0.8332940582393537,
70
+ "support": 29705.0
71
  },
72
  "step": 41
73
  }
 
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
+ "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3e60aef760c0bebacd32c85d34779d7bd28b7fb5a467a761ffe5e8a7e5bb2bb
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e06f6b44c30fa94c6272333e445e6562930fffeb3ba856f3a9330b45193b951f
3
  size 4728