DuongTrongChi committed on
Commit
90af786
·
verified ·
1 Parent(s): 6fba38a

Training in progress, step 81, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc941af358c41fdacb4643bbfec2e2f6cedd8ccebc8d32a056a9fe1f0067a572
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c0b9b66eb18cf0b855508e06ba01803083db1d16dbf2b0fffd8f4d3ca32afc1
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:171a625f2f946875f946841d317f73ae901bc37acb6617c511d58b5b274af3c6
3
  size 37430836
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1ee4c082d32f2e525bbdd97fd0fb1392f16516055373773711cc8ff57d3b7d8
3
  size 37430836
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a97cd7f079d7f12ed4724344a7cbd6b5515d4008435f2e5a63f0ce71a90c202c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92cb433dd7b6353454fd7a1a5cd6ae3809d9ab1ab0b7913e6509216203ba9cb2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.2139917695473251,
5
  "eval_steps": 500,
6
- "global_step": 78,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -553,6 +553,27 @@
553
  "learning_rate": 0.00015600000000000002,
554
  "loss": 1.2942,
555
  "step": 78
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
556
  }
557
  ],
558
  "logging_steps": 1,
@@ -572,7 +593,7 @@
572
  "attributes": {}
573
  }
574
  },
575
- "total_flos": 9.669833466976666e+16,
576
  "train_batch_size": 4,
577
  "trial_name": null,
578
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.2222222222222222,
5
  "eval_steps": 500,
6
+ "global_step": 81,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
553
  "learning_rate": 0.00015600000000000002,
554
  "loss": 1.2942,
555
  "step": 78
556
+ },
557
+ {
558
+ "epoch": 0.2167352537722908,
559
+ "grad_norm": 0.09426167607307434,
560
+ "learning_rate": 0.00015800000000000002,
561
+ "loss": 1.333,
562
+ "step": 79
563
+ },
564
+ {
565
+ "epoch": 0.2194787379972565,
566
+ "grad_norm": 0.09674811363220215,
567
+ "learning_rate": 0.00016,
568
+ "loss": 1.3242,
569
+ "step": 80
570
+ },
571
+ {
572
+ "epoch": 0.2222222222222222,
573
+ "grad_norm": 0.09802138805389404,
574
+ "learning_rate": 0.000162,
575
+ "loss": 1.3322,
576
+ "step": 81
577
  }
578
  ],
579
  "logging_steps": 1,
 
593
  "attributes": {}
594
  }
595
  },
596
+ "total_flos": 1.0050886434935194e+17,
597
  "train_batch_size": 4,
598
  "trial_name": null,
599
  "trial_params": null