tuanna08go commited on
Commit
852342a
·
verified ·
1 Parent(s): 1d337d9

Training in progress, step 26, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc64c7aca36b556493920a1579db632d1384c45a36ac185dec3b8e1d4b492c78
3
  size 390888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1040f95c6f7f116c38c2bf7eea8a30f200d211cbf352a6bad03b1af94fc0fa
3
  size 390888
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db8b85c338c34db5bcf64595492716fa17a71815ec97d9e7e13c35a583c7b157
3
  size 819770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fc2703554c63a96579e1a3220d5c9bfa89139b0a551397d9442451ce0bb0298
3
  size 819770
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1702dcc0f9d9a8f9c63e74896356a19749f4963949bab512e43e702fe77962c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dff7474c416c2bfd55209bee67ee6bd1d6630537f2cf74fba6d21acac7fd83c4
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0fc309d4608eca7c1f00c14befe35df8d98572a350ac190aaac790dc1a0befb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5d17cc7d96fbe24ad40a731f4825abc56336860d89f3ac12726fee59c43123c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.8096385542168675,
5
  "eval_steps": 6,
6
- "global_step": 21,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -53,6 +53,14 @@
53
  "learning_rate": 1.4644660940672627e-05,
54
  "loss": 8.7746,
55
  "step": 20
 
 
 
 
 
 
 
 
56
  }
57
  ],
58
  "logging_steps": 10,
@@ -67,12 +75,12 @@
67
  "should_evaluate": false,
68
  "should_log": false,
69
  "should_save": true,
70
- "should_training_stop": false
71
  },
72
  "attributes": {}
73
  }
74
  },
75
- "total_flos": 22027670913024.0,
76
  "train_batch_size": 8,
77
  "trial_name": null,
78
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0313253012048194,
5
  "eval_steps": 6,
6
+ "global_step": 26,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
53
  "learning_rate": 1.4644660940672627e-05,
54
  "loss": 8.7746,
55
  "step": 20
56
+ },
57
+ {
58
+ "epoch": 0.9253012048192771,
59
+ "eval_loss": 8.70206356048584,
60
+ "eval_runtime": 0.6614,
61
+ "eval_samples_per_second": 264.61,
62
+ "eval_steps_per_second": 33.265,
63
+ "step": 24
64
  }
65
  ],
66
  "logging_steps": 10,
 
75
  "should_evaluate": false,
76
  "should_log": false,
77
  "should_save": true,
78
+ "should_training_stop": true
79
  },
80
  "attributes": {}
81
  }
82
  },
83
+ "total_flos": 27272354463744.0,
84
  "train_batch_size": 8,
85
  "trial_name": null,
86
  "trial_params": null