Theoreticallyhugo committed on
Commit
611a6d2
1 Parent(s): 6c1f56c

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88c07cbc53c51f5c54df711ef5979bc1f3418049f6d85a04b3dbda81a97924a1
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69b9ba937b00c0bff3bf5290f197251c779721017cdb182752b71e8c7bfa7a9c
3
  size 592330980
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:607460e5b1146da32c681dd270585cfb7f0e8ea70592e43e5c102d6094ae78cc
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08e3e7034f6ea0face55aa4d5a5b9cf98d774aefa195cee077742d829291fbb1
3
  size 1014670074
checkpoint-41/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2edfde65f52fe0fcbc13f549dfed4fa891e3eb1476a6c03774294faa3865fa33
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea37e94b47f3f494a56a7641c427579f080658979e969fdceddf122598ddd745
3
  size 1064
checkpoint-41/trainer_state.json CHANGED
@@ -14,68 +14,68 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 271.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 139.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.22222222222222218,
27
- "precision": 0.780952380952381,
28
- "recall": 0.12954186413902052,
29
- "support": 633.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.3239807781739265,
33
- "precision": 0.42653061224489797,
34
- "recall": 0.26118470382404396,
35
- "support": 4001.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.43526510480887787,
39
- "precision": 0.5735174654752234,
40
- "recall": 0.35072031793343267,
41
- "support": 2013.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8370338686471983,
45
- "precision": 0.7484180515958556,
46
- "recall": 0.9494530698659139,
47
- "support": 11336.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.8603704893457543,
51
- "precision": 0.8500846381718155,
52
- "recall": 0.8709083026230219,
53
- "support": 9226.0
54
  },
55
- "eval_accuracy": 0.7469857706651218,
56
- "eval_loss": 0.6934069395065308,
57
  "eval_macro avg": {
58
- "f1-score": 0.3826960661711399,
59
- "precision": 0.48278616406288194,
60
- "recall": 0.3659726083407761,
61
- "support": 27619.0
62
  },
63
- "eval_runtime": 1.3993,
64
- "eval_samples_per_second": 57.171,
65
- "eval_steps_per_second": 7.146,
66
  "eval_weighted avg": {
67
- "f1-score": 0.7147071394985115,
68
- "precision": 0.7126373293529855,
69
- "recall": 0.7469857706651218,
70
- "support": 27619.0
71
  },
72
  "step": 41
73
  }
74
  ],
75
  "logging_steps": 500,
76
- "max_steps": 656,
77
  "num_input_tokens_seen": 0,
78
- "num_train_epochs": 16,
79
  "save_steps": 500,
80
  "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 284.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 141.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.0028169014084507044,
27
+ "precision": 0.5,
28
+ "recall": 0.0014124293785310734,
29
+ "support": 708.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.2423290994719566,
33
+ "precision": 0.28976109215017065,
34
+ "recall": 0.20824135393671817,
35
+ "support": 4077.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.30434782608695654,
39
+ "precision": 0.5460358056265985,
40
+ "recall": 0.21096837944664032,
41
+ "support": 2024.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8170132059567293,
45
+ "precision": 0.7161945812807882,
46
+ "recall": 0.9508665794637018,
47
+ "support": 12232.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.8384247714048214,
51
+ "precision": 0.8602345415778252,
52
+ "recall": 0.8176935549250102,
53
+ "support": 9868.0
54
  },
55
+ "eval_accuracy": 0.7151087475284653,
56
+ "eval_loss": 0.7737340927124023,
57
  "eval_macro avg": {
58
+ "f1-score": 0.31499025776127354,
59
+ "precision": 0.41603228866219755,
60
+ "recall": 0.31274032816437164,
61
+ "support": 29334.0
62
  },
63
+ "eval_runtime": 1.417,
64
+ "eval_samples_per_second": 56.458,
65
+ "eval_steps_per_second": 7.057,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.6774818055577092,
68
+ "precision": 0.6780466018204494,
69
+ "recall": 0.7151087475284653,
70
+ "support": 29334.0
71
  },
72
  "step": 41
73
  }
74
  ],
75
  "logging_steps": 500,
76
+ "max_steps": 205,
77
  "num_input_tokens_seen": 0,
78
+ "num_train_epochs": 5,
79
  "save_steps": 500,
80
  "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea7dd3e20b3e160af2247e96dc319ccd6cb101ae7dc47f0b44b05679d4ad74d7
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:434fba18a7a4c71e9fb6d8a84b52f11eea7c37f4a33492fefa13b8d79d7d0cd7
3
  size 4664