DuongTrongChi commited on
Commit
1ea25ac
·
verified ·
1 Parent(s): 62a2d9b

Training in progress, step 362, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e964069ed6905838724c8bddb757b9081b6303c228688b0ed62c673c8563f016
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fb2843ddc4cba95974551863bba6c4935b61fcb31a72746a913a75afce38248
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a685eded7eb7c5ae5ff5440af83afaceebf3da7612bb42df8148022ad92f5c61
3
  size 37431220
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64ebc82a6b239be7744ec22dd39159be08a7a1faea8b33f8524f88b458b12105
3
  size 37431220
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:358cc543a4dfee9cdbd11d603288fa82292225e6222d3a6078f1df3f3c96f685
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:febf6ccb9fdc9f04c34f343b5c08edd19841817cf6f806550bdab6dba83f9228
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.99039780521262,
5
  "eval_steps": 500,
6
- "global_step": 361,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -2534,6 +2534,13 @@
2534
  "learning_rate": 2.2727272727272728e-06,
2535
  "loss": 1.0866,
2536
  "step": 361
 
 
 
 
 
 
 
2537
  }
2538
  ],
2539
  "logging_steps": 1,
@@ -2553,7 +2560,7 @@
2553
  "attributes": {}
2554
  }
2555
  },
2556
- "total_flos": 4.468104090052854e+17,
2557
  "train_batch_size": 4,
2558
  "trial_name": null,
2559
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9931412894375857,
5
  "eval_steps": 500,
6
+ "global_step": 362,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
2534
  "learning_rate": 2.2727272727272728e-06,
2535
  "loss": 1.0866,
2536
  "step": 361
2537
+ },
2538
+ {
2539
+ "epoch": 0.9931412894375857,
2540
+ "grad_norm": 0.16839098930358887,
2541
+ "learning_rate": 1.5151515151515152e-06,
2542
+ "loss": 1.1158,
2543
+ "step": 362
2544
  }
2545
  ],
2546
  "logging_steps": 1,
 
2560
  "attributes": {}
2561
  }
2562
  },
2563
+ "total_flos": 4.48001389334913e+17,
2564
  "train_batch_size": 4,
2565
  "trial_name": null,
2566
  "trial_params": null