naman1011 committed on
Commit
e9d0f84
·
1 Parent(s): c28e416

Training in progress, step 1500, checkpoint

Browse files
last-checkpoint/global_step1500/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad45807b213eb148d0bdcbc685c255f57eeaafd1adf4fa191e60aebec46e8742
3
+ size 77125
last-checkpoint/global_step1500/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58a9529806b74369e61ae304c3d3053fd0187f1bc4e986ca2dcc7f1fc9afd449
3
+ size 181523565
last-checkpoint/global_step1500/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:396a26d95b53e4e5870eae98798d41db844210f38e705aed71ea34c9b6f84cf8
3
+ size 76997
last-checkpoint/global_step1500/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc4b938d275f542c62dc6288898a7b28064ed43540f5f8dc2a06d1aac6e03c45
3
+ size 181523565
last-checkpoint/global_step1500/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a8bd5b3b5268efb898fe728303d908983623e05d8e6c3cec43982cf12bafa5
3
+ size 76997
last-checkpoint/global_step1500/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da8c00e46c3bc4c0821ea7b20b84073c03bfa324cb710027303657f7a06b0d0b
3
+ size 181523565
last-checkpoint/global_step1500/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62334d958c423aa318ab2649fc7949e8fee64bc7ab618ac1403aa296b2f74fdd
3
+ size 76997
last-checkpoint/global_step1500/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12c10faf7f0180ab70dd51abc957a2dbda112ba269a717d8d027b5569120eef2
3
+ size 181523565
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1000
 
1
+ global_step1500
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9c2bbd8242bb5c02d5efae94f8f42fb03edd2c72266a812ab965e463320da46
3
  size 242070038
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194af0302478c97171645454a5eb846b0fc5f8e392d4e3959fa03596fc8e4026
3
  size 242070038
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dce2c50c7664fbb16a8b2e43e54b53331c5316cfb271b983da1e5fecb8f17cbd
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d3cf537aeb636d74260ac33f9ee9f5f5488cd868e57c67412d317e90d714583
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0840849d39e1eaa57787311e4d0c83224a6ddc9e6a9cb14192c8ed84be6eab9
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f46e6b131c11a49aaf40dd0567abef518102c7a1352bb71be9e97f08d2acdd07
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9eab21c7407cea42cd27eaeed6921c9d828e73c23bb9f05f571d16961ccadac8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af26ea8cc81928ae6c96810dd49af32aaee79970eeeea540d94edd0eded31879
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3aa9b8022f28fa939456417d280e7aafb2c4ebe7a3815d932c02df2e413189df
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28da90f216354525bfc6e2c4fb7d9537e9448788220df6cdda43e8d5ba71d985
3
  size 15024
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -19,13 +19,19 @@
19
  "learning_rate": 0.01,
20
  "loss": 0.1287,
21
  "step": 1000
 
 
 
 
 
 
22
  }
23
  ],
24
  "logging_steps": 500,
25
  "max_steps": 2500,
26
  "num_train_epochs": 10,
27
  "save_steps": 500,
28
- "total_flos": 169032155136.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.0,
5
  "eval_steps": 500,
6
+ "global_step": 1500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
19
  "learning_rate": 0.01,
20
  "loss": 0.1287,
21
  "step": 1000
22
+ },
23
+ {
24
+ "epoch": 6.0,
25
+ "learning_rate": 0.01,
26
+ "loss": 0.1689,
27
+ "step": 1500
28
  }
29
  ],
30
  "logging_steps": 500,
31
  "max_steps": 2500,
32
  "num_train_epochs": 10,
33
  "save_steps": 500,
34
+ "total_flos": 253548232704.0,
35
  "trial_name": null,
36
  "trial_params": null
37
  }