iamnguyen commited on
Commit
6e9d640
·
verified ·
1 Parent(s): 511c64a

Training in progress, step 16, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21a2f62efd0d71d0d134266e515dda3b88038f99e0b24c6a836737401f2339a3
3
  size 2964338224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07e1ddb55498e50628c3310f9086dc621dc5fb0c6268ed92605cab47f2644b67
3
  size 2964338224
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9bb165d055492bacaa7fc7f6a4b7aa35f27f884ae2282741026ab19d8357fdb
3
  size 1485440604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3df4c3f5410aef96aa5d1b1220d16d0e42419e2f967dd28291d6cd8a4e444dc
3
  size 1485440604
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c200f8fdcde78c415e4babf1b6f200bbf13323757b5b248ace34314bfbe3fd44
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:927fd63e57181ecc0ac827facbdec2bc46e991f92e1716e5d98f2005a0b865c2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.6894075403949731,
5
  "eval_steps": 500,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -91,6 +91,34 @@
91
  "learning_rate": 4.970701059450872e-05,
92
  "loss": 2.2359,
93
  "step": 12
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  }
95
  ],
96
  "logging_steps": 1,
@@ -110,7 +138,7 @@
110
  "attributes": {}
111
  }
112
  },
113
- "total_flos": 8132581322686464.0,
114
  "train_batch_size": 2,
115
  "trial_name": null,
116
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9192100538599641,
5
  "eval_steps": 500,
6
+ "global_step": 16,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
91
  "learning_rate": 4.970701059450872e-05,
92
  "loss": 2.2359,
93
  "step": 12
94
+ },
95
+ {
96
+ "epoch": 0.7468581687612208,
97
+ "grad_norm": 1.6817108392715454,
98
+ "learning_rate": 4.934238559694448e-05,
99
+ "loss": 2.2229,
100
+ "step": 13
101
+ },
102
+ {
103
+ "epoch": 0.8043087971274686,
104
+ "grad_norm": 1.6007517576217651,
105
+ "learning_rate": 4.8834909801373264e-05,
106
+ "loss": 2.203,
107
+ "step": 14
108
+ },
109
+ {
110
+ "epoch": 0.8617594254937163,
111
+ "grad_norm": 1.457571029663086,
112
+ "learning_rate": 4.8187561277552374e-05,
113
+ "loss": 2.0994,
114
+ "step": 15
115
+ },
116
+ {
117
+ "epoch": 0.9192100538599641,
118
+ "grad_norm": 1.486559271812439,
119
+ "learning_rate": 4.740413892402639e-05,
120
+ "loss": 2.1777,
121
+ "step": 16
122
  }
123
  ],
124
  "logging_steps": 1,
 
138
  "attributes": {}
139
  }
140
  },
141
+ "total_flos": 1.0873463700504576e+16,
142
  "train_batch_size": 2,
143
  "trial_name": null,
144
  "trial_params": null