nour4286 commited on
Commit
0b6477f
1 Parent(s): 76ebe7e

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-1528/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e046d25e4ad5c74b91be4fd3536533fc0663fa47e08b72382d149f3176a5d205
3
  size 557116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74e357ce0b7042a6f40e5f45c53ad211d929476c8e3445c880e62339e20b708b
3
  size 557116312
checkpoint-1528/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae7c16a498d582599cd05fbab821d1100a28ed8fbbbe5e414bac30bd70fe8299
3
  size 1113991930
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe26fcb5c0e353bf67a52789fb4cfae7be61e381b062d125ca91b1c604de9b5
3
  size 1113991930
checkpoint-1528/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8e6dccea0da7d7eff4bfe6269cc5b94b43442b566ea0f37db1b49e1824d969a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a1c88126ef67a930b2cd0c54619e80f9ef80c6abae00cbf436ab3946bd2d2c0
3
  size 1064
checkpoint-1528/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 25.4493,
3
- "best_model_checkpoint": "my-model/checkpoint-1528",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 1528,
@@ -10,41 +10,41 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.32722513089005234,
13
- "grad_norm": 0.41872361302375793,
14
- "learning_rate": 4.836387434554974e-05,
15
- "loss": 0.0155,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.6544502617801047,
20
- "grad_norm": 2.3573551177978516,
21
- "learning_rate": 4.6727748691099475e-05,
22
- "loss": 0.0193,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.981675392670157,
27
- "grad_norm": 2.1439473628997803,
28
- "learning_rate": 4.5091623036649215e-05,
29
- "loss": 0.0231,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 1.0,
34
- "eval_loss": 5.686821937561035,
35
- "eval_rouge1": 25.4493,
36
- "eval_rouge2": 10.1381,
37
- "eval_rougeL": 22.2977,
38
- "eval_runtime": 389.9026,
39
- "eval_samples_per_second": 5.63,
40
- "eval_steps_per_second": 0.564,
41
  "step": 1528
42
  }
43
  ],
44
  "logging_steps": 500,
45
- "max_steps": 15280,
46
  "num_input_tokens_seen": 0,
47
- "num_train_epochs": 10,
48
  "save_steps": 500,
49
  "stateful_callbacks": {
50
  "TrainerControl": {
 
1
  {
2
+ "best_metric": 25.2705,
3
+ "best_model_checkpoint": "./ArabartModel-1/checkpoint-1528",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 1528,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.32722513089005234,
13
+ "grad_norm": 1.563672423362732,
14
+ "learning_rate": 4.6727748691099475e-05,
15
+ "loss": 0.0195,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.6544502617801047,
20
+ "grad_norm": 1.7397737503051758,
21
+ "learning_rate": 4.3455497382198955e-05,
22
+ "loss": 0.0244,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.981675392670157,
27
+ "grad_norm": 3.006633758544922,
28
+ "learning_rate": 4.018324607329843e-05,
29
+ "loss": 0.0293,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 1.0,
34
+ "eval_loss": 5.626201629638672,
35
+ "eval_rouge1": 25.2705,
36
+ "eval_rouge2": 9.9865,
37
+ "eval_rougeL": 21.8678,
38
+ "eval_runtime": 372.5145,
39
+ "eval_samples_per_second": 5.892,
40
+ "eval_steps_per_second": 0.591,
41
  "step": 1528
42
  }
43
  ],
44
  "logging_steps": 500,
45
+ "max_steps": 7640,
46
  "num_input_tokens_seen": 0,
47
+ "num_train_epochs": 5,
48
  "save_steps": 500,
49
  "stateful_callbacks": {
50
  "TrainerControl": {
checkpoint-1528/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0647ffd63ecebccd487ca666ebff2e4007c4297f5565f476a9bab5a6aa5081d1
3
- size 6968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db0c5c28c9a1e67e13675dc0782cb65baca4516e1c39cf487f5c45dc85be680
3
+ size 6904