Shresthadev403 committed on
Commit
8d89165
1 Parent(s): 5198944

End of training

Browse files
README.md CHANGED
@@ -13,12 +13,12 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
- - eval_loss: 1.6092
17
- - eval_runtime: 0.0205
18
- - eval_samples_per_second: 48.823
19
- - eval_steps_per_second: 48.823
20
- - epoch: 64.0
21
- - step: 64
22
 
23
  ## Model description
24
 
 
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - eval_loss: 1.6176
17
+ - eval_runtime: 0.0198
18
+ - eval_samples_per_second: 50.41
19
+ - eval_steps_per_second: 50.41
20
+ - epoch: 65.0
21
+ - step: 65
22
 
23
  ## Model description
24
 
logs/events.out.tfevents.1707026588.d77ab3a64c5c.34.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94232f3ccf63cd83b0fd10a681fe1da1ed75cc824e16fc93d6019254ee1a2bd5
3
- size 24866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a2bcf27210ecac6445b4fe91ea33ce8d1ef0fe1e674dface52bc3202cc443cf
3
+ size 25286
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35477aab7a0d675972e3637322e028ad7b025b3cc2ea5013d9358f7f5b631137
3
  size 497918592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da4205de6c9b412522e8795d80c3b85811b3e3b76a381747df431aa887d43f3b
3
  size 497918592
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.5992611646652222,
3
  "best_model_checkpoint": "controlled-food-recipe-generation/checkpoint-53",
4
- "epoch": 64.0,
5
  "eval_steps": 1,
6
- "global_step": 64,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -903,6 +903,20 @@
903
  "eval_samples_per_second": 48.823,
904
  "eval_steps_per_second": 48.823,
905
  "step": 64
 
 
 
 
 
 
 
 
 
 
 
 
 
 
906
  }
907
  ],
908
  "logging_steps": 1,
@@ -910,7 +924,7 @@
910
  "num_input_tokens_seen": 0,
911
  "num_train_epochs": 100,
912
  "save_steps": 1,
913
- "total_flos": 37626052608000.0,
914
  "train_batch_size": 32,
915
  "trial_name": null,
916
  "trial_params": null
 
1
  {
2
  "best_metric": 1.5992611646652222,
3
  "best_model_checkpoint": "controlled-food-recipe-generation/checkpoint-53",
4
+ "epoch": 65.0,
5
  "eval_steps": 1,
6
+ "global_step": 65,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
903
  "eval_samples_per_second": 48.823,
904
  "eval_steps_per_second": 48.823,
905
  "step": 64
906
+ },
907
+ {
908
+ "epoch": 65.0,
909
+ "learning_rate": 2.7500000000000004e-05,
910
+ "loss": 1.0987,
911
+ "step": 65
912
+ },
913
+ {
914
+ "epoch": 65.0,
915
+ "eval_loss": 1.6176224946975708,
916
+ "eval_runtime": 0.0198,
917
+ "eval_samples_per_second": 50.41,
918
+ "eval_steps_per_second": 50.41,
919
+ "step": 65
920
  }
921
  ],
922
  "logging_steps": 1,
 
924
  "num_input_tokens_seen": 0,
925
  "num_train_epochs": 100,
926
  "save_steps": 1,
927
+ "total_flos": 38213959680000.0,
928
  "train_batch_size": 32,
929
  "trial_name": null,
930
  "trial_params": null