jssky committed on
Commit
d781d02
·
verified ·
1 Parent(s): 2a46b3c

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:009435752cba422c5e8cbaf14d90b8c439ea6b7fd0dc7358e968cc0a4b9122f3
3
  size 50503544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:550f93216f0b5f3fdf4bf2efe0f7225b795fc220a07384321b81741105d9e069
3
  size 50503544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97081d766c1efd083986e7037f3441e71755761df25e179dc3334cdf6088b140
3
  size 25986148
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbe3a8b2e24fdc50dfe38d273f9deaf75d4da9a207f66628d6a977773660e828
3
  size 25986148
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f50d1f2a647ab66bf93520813e13396221f342eeb0033fac7d886683239dbca
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22ff52b36e238ec8c5e0ae77ac3a583321bf95dd765824a123fa18ceebc689e0
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8066cf8d591755892e9112cdbf2b6cedcdc6a2248abd6ea2145bf28de0d8d85f
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b4c9435b0b42cc713eea6ce123a4d1aaa03f4cdaabf4128ab6be48043d8bc62
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ecffe7252c8c9baeec2930898096ca83078383402ee33b5b0186d53d3b0ca53
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2e2aa09dba491989d2e653b5122858cda9732d0dc8bda6aad86d87f1fcf803
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4612ac416d87f114d4517611323e4353adc5c12edfd9a825bfd49510f2c555e7
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab66a9e238747970935c296838109efc33d576c0992707e87ca257f11ab75f6e
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87a58c8092333296a66f332b13e3b0089eabe239eaa24306cbe2a62602f3ecdf
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ab3b4e07057099d0e9661e1108f2c94b4126ad0ab0c44ca9af6bb3bd2b9917
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fabd0190b381df37676269268d272e959c191aa77066c59eec355ac0d052d21
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93d9cfb36627643297556d68c2fd167c699a88be208868dcbda74b3ac3776f89
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ce7d88d0986f2975640fe8d0812c75f9e9b7879cde5110f70aad32b8c02d3be
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93cbba61e44f8fd9c87c04ea2cdc110c1935c7ab4cc89cedce4b353e290f89c1
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aff709ea200ea8eb08d4178c7dddb1a3a3a68d69709bda0ce59028a7312d1c52
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:265760fe9788697ec3bf61fb178eb21105e6530a3fc23196bb8dddc8fa2ea6db
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a93b2a1f4b5368650119fe6e0d6eec6d19cda6badeba4d21943ab48964fa00
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.02102803738317757,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 118.252,
103
  "eval_steps_per_second": 14.925,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 7411455158648832.0,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.02336448598130841,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 118.252,
103
  "eval_steps_per_second": 14.925,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.02336448598130841,
108
+ "grad_norm": 0.48678022623062134,
109
+ "learning_rate": 0.00016,
110
+ "loss": 1.6706,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 8234950176276480.0,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null