redo-checkpoint-224000

Files changed (13) hide show

config.json CHANGED Viewed

@@ -1,8 +1,7 @@
 {
-  "_name_or_path": "stanford-crfm/celebrimbor-gpt2-medium-x81",
   "activation_function": "gelu_new",
   "architectures": [
-    "GPT2LMHeadModel"
   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
@@ -20,10 +19,7 @@
   "n_positions": 1024,
   "n_special": 0,
   "predict_special_tokens": true,
-  "reorder_and_upcast_attn": true,
   "resid_pdrop": 0.1,
-  "scale_attn_by_inverse_layer_idx": true,
-  "scale_attn_weights": true,
   "summary_activation": null,
   "summary_first_dropout": 0.1,
   "summary_proj_to_labels": true,
@@ -35,7 +31,7 @@
       "max_length": 50
     }
   },
-  "transformers_version": "4.12.5",
   "use_cache": false,
   "vocab_size": 50257
 }

 {
   "activation_function": "gelu_new",
   "architectures": [
+    "MistralGPT2LMHeadModel"
   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
   "n_positions": 1024,
   "n_special": 0,
   "predict_special_tokens": true,
   "resid_pdrop": 0.1,
   "summary_activation": null,
   "summary_first_dropout": 0.1,
   "summary_proj_to_labels": true,
       "max_length": 50
     }
   },
+  "transformers_version": "4.5.0",
   "use_cache": false,
   "vocab_size": 50257
 }

global_step224011/mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8611392c1049fdee0b542a4d29ca144bb1334dbf899a492476b85fce595c686d
+size 734886248

global_step224011/zero_pp_rank_0_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:af2e21f391c6c933293b8cbe894d7e309e237483c4181568be0812da21d9f5ff
+size 266119242

global_step224011/zero_pp_rank_1_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6987ab58104ccd96f9a91d4aa0bdee6b000cc30cceaf61679ff6783a3974db06
+size 266119242

global_step224011/zero_pp_rank_2_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9431fb909beb02d5b6584ed7a03d2fd9e261a492d66acda68416a91629932776
+size 266119242

global_step224011/zero_pp_rank_3_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c750457f453fed4d6630433b463f16221a5825ba5c91c749b9e5fb0eed7da0a
+size 266119242

global_step224011/zero_pp_rank_4_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c9ccbbe6b268c400946299a37e17140472d52d8738cd5bd082b780cf09fa9196
+size 266119242

global_step224011/zero_pp_rank_5_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4faeee1db3554f70d5e443bd5070ad51e1a5a279066a3728b325abaad9b43bc7
+size 266119242

global_step224011/zero_pp_rank_6_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6181d85ae79147c88c4a80045edd7dbda650d7b47be192ac2dcc03c8780bfa6
+size 266119242

global_step224011/zero_pp_rank_7_mp_rank_00optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba264912db52c13d29e971efd258b5edbb9fe5fdd1cb0cd5cb85c0b4d4fed220
+size 266119242

latest CHANGED Viewed

	@@ -1 +1 @@
1	- ~~global_step99004~~


1	+ global_step224011

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dc2666775d30b92af2628777c6e0847c5f526182ba8a111a1978760e6198aedb
 size 734885928

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb1387226a204beb240f551b88f183d99903f7fca6a85e1a0fb95b7fdaf5a242
 size 734885928

trainer_state.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:090ef154fad084210cc130292d9f3fa9b4d4bbe24a29f527df898b2fbf1756ba
-size 6922082

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab15f7b14dd53416bc7ad71fa88e82e50a944cde9da707484f962e51dba0c31d
+size 15668929