Francesco0101 commited on
Commit
7788903
1 Parent(s): ee5d02d

Training in progress, step 6000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c7e78804dd19cd55c65a1b6b95b5c55996dc7c4a8c1d11b210ee7423c2313fc
3
  size 267835644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a04667c008502e91e06fe4ddbdbe9546b47afa389d863fcab516dd677024a7a
3
  size 267835644
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:379de5d281003514e53cff5d5da207fad69f34d9d6b845d9d7026096a123dc3e
3
  size 535733434
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1976ef43ce351bc5e7482a4f88d5b02ba7afb62acc5f9c10faaf9ea69ee52ad
3
  size 535733434
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca9f956b39f51ec6c505767cab574a3581a608a9ada47e5e1ea34242b023aaa2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b9ae8ccced4a36fd061b274c705b6295d38a5288bf82c4c189b032dcc5f78bb
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27ebe124b49d962b3686f19f4ac88c29ccf1175d00244819004baf43745fc5ca
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87a047fc70d34ba9e25294567dfd8e018dbff83f6d11a990d60dd7e409be4fbb
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.7293047058493298,
3
  "best_model_checkpoint": "training_dir/checkpoint-5000",
4
- "epoch": 0.7829627309740056,
5
  "eval_steps": 1000,
6
- "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,25 @@
102
  "eval_samples_per_second": 76.93,
103
  "eval_steps_per_second": 9.616,
104
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1000,
@@ -121,7 +140,7 @@
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 5037055031256768.0,
125
  "train_batch_size": 8,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": 0.7293047058493298,
3
  "best_model_checkpoint": "training_dir/checkpoint-5000",
4
+ "epoch": 0.9395552771688067,
5
  "eval_steps": 1000,
6
+ "global_step": 6000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 76.93,
103
  "eval_steps_per_second": 9.616,
104
  "step": 5000
105
+ },
106
+ {
107
+ "epoch": 0.9395552771688067,
108
+ "grad_norm": 16.398216247558594,
109
+ "learning_rate": 9.131944444444445e-06,
110
+ "loss": 0.4562,
111
+ "step": 6000
112
+ },
113
+ {
114
+ "epoch": 0.9395552771688067,
115
+ "eval_accuracy": 0.728583916083916,
116
+ "eval_f1": 0.722523941260205,
117
+ "eval_loss": 0.764935314655304,
118
+ "eval_precision": 0.7390044648352858,
119
+ "eval_recall": 0.728583916083916,
120
+ "eval_runtime": 29.8199,
121
+ "eval_samples_per_second": 76.727,
122
+ "eval_steps_per_second": 9.591,
123
+ "step": 6000
124
  }
125
  ],
126
  "logging_steps": 1000,
 
140
  "attributes": {}
141
  }
142
  },
143
+ "total_flos": 6048548589955680.0,
144
  "train_batch_size": 8,
145
  "trial_name": null,
146
  "trial_params": null