dq158 committed on
Commit
aa61544
1 Parent(s): 4493c49

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/global_step2371/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f3e5e7e338e56c0fbb48dba67f5ad0e53df13693caeda65462254f6067e8d9f
3
+ size 28315088
last-checkpoint/global_step2371/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d8f7b1661851c1b8fbee6ffeba88cce356bccb656ec91070303ba55c1fc1eb2
3
+ size 28315088
last-checkpoint/global_step2371/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b8c03a6449fd7949a535a46dce0b2d86946a69c104e0bbe9fe2ac1a6e1cc5be
3
+ size 2850543502
last-checkpoint/global_step2371/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f0963d69e05ca8b0f098eb885f18d94e378a847bcb3061cf12600b23aec9607
3
+ size 2850543310
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1581
 
1
+ global_step2371
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f08f5222c04ba8a25b70996b406c1e95dc834c73f15f3e7248da94c55fa3d6d3
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ebcc4f849c319e84877c5a5616307940f594a3127631dce316993029034eeb0
3
  size 14512
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:707f46a874ccec694d9a9ebdb8230159a79dc68e5bca12742f90f6e6d892b27e
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05b01af9cac14bdb0b4fce5f6be228a514d12ae472bc890371393ba7752dafc0
3
  size 14512
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.288722038269043,
3
- "best_model_checkpoint": "dq158/pingusPongus/checkpoint-1581",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 1581,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -63,13 +63,38 @@
63
  "eval_steps_per_second": 0.131,
64
  "eval_translation_length": 53391,
65
  "step": 1581
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
66
  }
67
  ],
68
  "logging_steps": 500,
69
  "max_steps": 23700,
70
  "num_train_epochs": 30,
71
  "save_steps": 500,
72
- "total_flos": 771945142419456.0,
73
  "trial_name": null,
74
  "trial_params": null
75
  }
 
1
  {
2
+ "best_metric": 2.2401010990142822,
3
+ "best_model_checkpoint": "dq158/pingusPongus/checkpoint-2371",
4
+ "epoch": 2.9993674889310564,
5
  "eval_steps": 500,
6
+ "global_step": 2371,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
63
  "eval_steps_per_second": 0.131,
64
  "eval_translation_length": 53391,
65
  "step": 1581
66
+ },
67
+ {
68
+ "epoch": 2.53,
69
+ "learning_rate": 0.0001,
70
+ "loss": 2.4165,
71
+ "step": 2000
72
+ },
73
+ {
74
+ "epoch": 3.0,
75
+ "eval_bleu": 1.0,
76
+ "eval_brevity_penalty": 1.0,
77
+ "eval_length_ratio": 1.0,
78
+ "eval_loss": 2.2401010990142822,
79
+ "eval_precisions": [
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0
84
+ ],
85
+ "eval_reference_length": 53401,
86
+ "eval_runtime": 1342.5303,
87
+ "eval_samples_per_second": 2.094,
88
+ "eval_steps_per_second": 0.131,
89
+ "eval_translation_length": 53401,
90
+ "step": 2371
91
  }
92
  ],
93
  "logging_steps": 500,
94
  "max_steps": 23700,
95
  "num_train_epochs": 30,
96
  "save_steps": 500,
97
+ "total_flos": 1158039818207232.0,
98
  "trial_name": null,
99
  "trial_params": null
100
  }