jasmeeetsingh commited on
Commit
c4dbbab
1 Parent(s): 9c1cb5e

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6998285b83c76b0c8b6261fb7f1bb65a13840c8bfcb02db5d5784746fb776e63
3
  size 8970189
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90c26c9d06a857c490bef2859c8d9f1a0df37d5078b3e76552e968745a76cdbb
3
  size 8970189
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9777e399c5a17fcd276312001542df42c3c884bfe4fa754694aebf70985a4be4
3
+ size 7759329147
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b185933120aaf5215bc19c0c41f20104627755b914b9f533e8c56e633bb5bb9d
3
+ size 13335934
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:793b34614c8c421107b416c21ed218bd3c76454d7c55652f8dd40224ad56acf2
3
+ size 7759329083
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f7c46f9c9f3f39d393bfa9eed0097e1efaee498dc202d6998d5983141217dd0
3
+ size 13335934
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d068479861b4e3aa01cda6948696a728b25fe9cfc026ffee836125e7b5efbdc
3
+ size 7759329083
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3629c1db35c1f44aebbd79af1eeb8d6de04795a82247c8064bc0f34c2f97ed44
3
+ size 13335934
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8157e4a6536a415ef623da111bfde901cc9eb5723a8e369300103093e7512b7f
3
+ size 7759329083
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:748b92ff50023d3b0f8d4b898ea05f11694fdcdf6d5b92b69f866c739a2b59f0
3
+ size 13335934
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1000
 
1
+ global_step2000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:467da56e383df870490dbb76caaf8269822eb56c33567fa108671031d311e54c
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f36f3108739132271885035e5faf177e77e529c599274b592066cfd46847f09
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ff1d2f7bd6edc0356aa4f5a34a2b19007ea4f6bfc18a8a03d3a5b32f347424b
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52c562c02b52d9091784791fd63a8de14c04f388fc95bf7cfc96a06c0d535229
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8e0752d412861e016be27a2016704d4dff7c30ba565cc508e85a549ef1682e4
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:854590c01dfe34d93f0fa12d48d05e5d5bcb7605ecd3692ab90d1341b4528c3b
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4174d249caf0ec0afeb299e38a8ea8d074ed385ffdd6c43c6712d2b378e5ea3
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f023641060de0ce868c668d29989cc44bffe8e1bb9aea8330ec656170354cf64
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.39093041438623927,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -13,13 +13,19 @@
13
  "learning_rate": 1e-05,
14
  "loss": 0.9471,
15
  "step": 1000
 
 
 
 
 
 
16
  }
17
  ],
18
  "logging_steps": 1000,
19
  "max_steps": 7674,
20
  "num_train_epochs": 3,
21
  "save_steps": 1000,
22
- "total_flos": 13615232974848.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7818608287724785,
5
  "eval_steps": 500,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
13
  "learning_rate": 1e-05,
14
  "loss": 0.9471,
15
  "step": 1000
16
+ },
17
+ {
18
+ "epoch": 0.78,
19
+ "learning_rate": 1e-05,
20
+ "loss": 0.7436,
21
+ "step": 2000
22
  }
23
  ],
24
  "logging_steps": 1000,
25
  "max_steps": 7674,
26
  "num_train_epochs": 3,
27
  "save_steps": 1000,
28
+ "total_flos": 27337888366592.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }