diff --git a/adapter_config.json b/adapter_config.json index 5b3f45c250ff330299d2364a46de0623dadd2f48..7052646debaf453de93d6176727714122c31b64a 100644 --- a/adapter_config.json +++ b/adapter_config.json @@ -15,12 +15,12 @@ "revision": null, "target_modules": [ "q_proj", + "v_proj", "gate_proj", + "up_proj", "o_proj", - "down_proj", "k_proj", - "v_proj", - "up_proj" + "down_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/adapter_model.bin b/adapter_model.bin index 3e8f72f386e2c3fe895fcb01c3f1de5f5fec965a..02526e93c7101a3c9d0727acfe024831696398f1 100644 --- a/adapter_model.bin +++ b/adapter_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:14ca48bd88a31002dc05f9274bc978bc8b5b8ae3e51470e74ee7bc0bb12284e9 +oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95 size 500897101 diff --git a/checkpoint-5000/adapter_model.bin b/checkpoint-5000/adapter_model.bin deleted file mode 100644 index 74814d55a55053c55b191f943aebee3639caff0a..0000000000000000000000000000000000000000 --- a/checkpoint-5000/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:658b9b2dec5afef11956f93a69d1e5899dfaf7ec45314dbb9a4f4fe9a8d341ef -size 500897101 diff --git a/checkpoint-5000/adapter_model/adapter_model.bin b/checkpoint-5000/adapter_model/adapter_model.bin deleted file mode 100644 index 74814d55a55053c55b191f943aebee3639caff0a..0000000000000000000000000000000000000000 --- a/checkpoint-5000/adapter_model/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:658b9b2dec5afef11956f93a69d1e5899dfaf7ec45314dbb9a4f4fe9a8d341ef -size 500897101 diff --git a/checkpoint-5000/optimizer.pt b/checkpoint-5000/optimizer.pt deleted file mode 100644 index 8707c624320e26944a53fa9f047051d0b513a55d..0000000000000000000000000000000000000000 --- a/checkpoint-5000/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:41a19364f98039f3de4a4fce0e0896ae1c403fab5b0de5a6478b8b3154215366 -size 1001752701 diff --git a/checkpoint-5000/rng_state_0.pth b/checkpoint-5000/rng_state_0.pth deleted file mode 100644 index f73c216ce5fd22f5ecf938f9ce19490ebda0e246..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c3591569acf36220e21cfa3f00c334d4afa5214c3fa0f7f20b6081190208a2ce -size 27772 diff --git a/checkpoint-5000/rng_state_1.pth b/checkpoint-5000/rng_state_1.pth deleted file mode 100644 index 9a1bca1061cb9ecbb689954ed2b3c0139d4c0cc6..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8a3d8da1aa54796771be8e0f102c1ba0e9bce209cd7f83f5e4242dbd0a2bfb18 -size 27772 diff --git a/checkpoint-5000/rng_state_10.pth b/checkpoint-5000/rng_state_10.pth deleted file mode 100644 index 80b4833fb8614da8c7b43ce2dc83031e875990e0..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:263b9c81bf6b52324cce079cb862bf0c4c6c076726306fe430175760cf77ce1d -size 27789 diff --git a/checkpoint-5000/rng_state_11.pth b/checkpoint-5000/rng_state_11.pth deleted file mode 100644 index 55da8e031dda486a87150730f3c006a6fbbf5def..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bfd9622dd9c9e0f101a3891d78b76d8a750232389d97fff8a48e4ab0113e3bf0 -size 27789 diff --git a/checkpoint-5000/rng_state_12.pth b/checkpoint-5000/rng_state_12.pth deleted file mode 100644 index 5b5cb3c73161b8926eb77bc67dfb981462a009f7..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8b52b3225a4c307e1e07d040be377b2268078fb40662cf123cf14c9225dfc3d2 -size 27789 diff --git a/checkpoint-5000/rng_state_13.pth b/checkpoint-5000/rng_state_13.pth deleted file mode 100644 index 6dfe05530fcc36078e9ea3388e3129a9802a8105..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a7022a9a5c490e593972113d5eec0a181e018cdd0b74c023342974a3d2a43471 -size 27789 diff --git a/checkpoint-5000/rng_state_2.pth b/checkpoint-5000/rng_state_2.pth deleted file mode 100644 index 5cc368ebea4eb59351da0dda32d9a0191a27645a..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7ea427538851652ebb74224ead7e27e9853d1a0254ab5742c7f4e6a75f1a155b -size 27772 diff --git a/checkpoint-5000/rng_state_3.pth b/checkpoint-5000/rng_state_3.pth deleted file mode 100644 index 2653f6afc0753f4f0a4b58884924393c50bb80e6..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:84c0d3bf83700c5dcf78d4bca3c01d4661af97db85b1e1021458aa4ebf191dc3 -size 27772 diff --git a/checkpoint-5000/rng_state_4.pth b/checkpoint-5000/rng_state_4.pth deleted file mode 100644 index 17dbc94de833c85869043071ac3cf178e4029c25..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:88b40363540e71d8f1d1cd8dbf6a880e5a85fe8c36554f2c6a6e6bf87eeee7ef -size 27772 diff --git a/checkpoint-5000/rng_state_5.pth b/checkpoint-5000/rng_state_5.pth deleted file mode 100644 index df12ecaeda7900c0fd8445f8454fddbd7f69c384..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f452a098fe1f3d5946e80ca1866e99d8de678f832a877b5bd605c904adccd168 -size 27772 diff --git a/checkpoint-5000/rng_state_6.pth b/checkpoint-5000/rng_state_6.pth deleted file mode 100644 index e13e80df498039dec0d69c9dc155f6312a63f53f..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6329d34fc46a440591bbc38dc3e735aa628275c46bc5f5d67ea60d2ac817c9f -size 27772 diff --git a/checkpoint-5000/rng_state_7.pth b/checkpoint-5000/rng_state_7.pth deleted file mode 100644 index 065afb9b400ec0ab624b9e2e1bd15cd06cf59c21..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abc478444408d585c8510980bf6c3724dbd04c62fe3f44191f641810f4f2b408 -size 27772 diff --git a/checkpoint-5000/rng_state_8.pth b/checkpoint-5000/rng_state_8.pth deleted file mode 100644 index e358a2d86e15d530d6710914fdaeabf2e6ef4dbe..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:43a4f27fdaf452bec4190380281039b2452b0cc819d9babdb1883bb6338b79df -size 27772 diff --git a/checkpoint-5000/rng_state_9.pth b/checkpoint-5000/rng_state_9.pth deleted file mode 100644 index b723433adb48a109d110cdae4d73db16f086be84..0000000000000000000000000000000000000000 --- a/checkpoint-5000/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd492bc5d4f48c5532176ee3ad99275b5bfcd315a528c245cfa8d46477f6b13e -size 27772 diff --git a/checkpoint-5000/scheduler.pt b/checkpoint-5000/scheduler.pt deleted file mode 100644 index e2325daf95e132d92ec86f58b07155dcd7d36553..0000000000000000000000000000000000000000 --- a/checkpoint-5000/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:091fab5b44662db384d56b3c50422b403065ff0f62fb64f68c521ac3c38ad752 -size 627 diff --git a/checkpoint-5000/training_args.bin b/checkpoint-5000/training_args.bin deleted file mode 100644 index 3c48003adcc192172e325b8bb81af1b30fac42f7..0000000000000000000000000000000000000000 --- a/checkpoint-5000/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:354c4769acaf21317d8ab58ba2dd133763f3bee1aec7488fb334e45f3e80ebc3 -size 4027 diff --git a/checkpoint-5100/adapter_model.bin b/checkpoint-5100/adapter_model.bin deleted file mode 100644 index 02bfb0de2c8392b01220dbad54f7d5ef7442c98a..0000000000000000000000000000000000000000 --- a/checkpoint-5100/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0782e3c048e8ec06b53914deeacadabf30a533ab881541cd5057d49805c57014 -size 500897101 diff --git a/checkpoint-5100/adapter_model/adapter_model.bin b/checkpoint-5100/adapter_model/adapter_model.bin deleted file mode 100644 index 02bfb0de2c8392b01220dbad54f7d5ef7442c98a..0000000000000000000000000000000000000000 --- a/checkpoint-5100/adapter_model/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0782e3c048e8ec06b53914deeacadabf30a533ab881541cd5057d49805c57014 -size 500897101 diff --git a/checkpoint-5100/optimizer.pt b/checkpoint-5100/optimizer.pt deleted file mode 100644 index b21a87e8fcf3f6c85917ddfde8ff26a8760467d8..0000000000000000000000000000000000000000 --- a/checkpoint-5100/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6e547facfed70ca3ced4bba623ceed57a68ada7036877bcb0fe8abdc4206a71d -size 1001752701 diff --git a/checkpoint-5100/rng_state_0.pth b/checkpoint-5100/rng_state_0.pth deleted file mode 100644 index efec54a19ef3ffcf3a35e80a278a57708f8818e3..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:93586c7c2f4af77dae57306cefbbba6e501b56255a6e8ab1e51526e93247ec0c -size 27772 diff --git a/checkpoint-5100/rng_state_1.pth b/checkpoint-5100/rng_state_1.pth deleted file mode 100644 index 006f0ce77824e8757b2a54d97497a090e281f67f..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:914cd17a4d5c2393130506ee74b380b7ebf49b994b8e1f7f9a5a5011789dcb9d -size 27772 diff --git a/checkpoint-5100/rng_state_10.pth b/checkpoint-5100/rng_state_10.pth deleted file mode 100644 index e924e089f5bee9985719b31ab4d4899670b1c7b3..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f79575017a903227eead6d8ec8c987f6c9f113b02cc3fdca1a05e6dfeb87c263 -size 27789 diff --git a/checkpoint-5100/rng_state_11.pth b/checkpoint-5100/rng_state_11.pth deleted file mode 100644 index e74dbc2c8bb80a5090f72f29d5ad891986eb0b03..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e862437c6ef81136a36f5dcccf18047c8bf5b5ce5c4cb6a5de4068de8ac98fd4 -size 27789 diff --git a/checkpoint-5100/rng_state_12.pth b/checkpoint-5100/rng_state_12.pth deleted file mode 100644 index c4ea8e665565e1e4ce619c18c3cf32bbb8416f68..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2bd910734bd5ed0209fccf18e21529e6637d89e5d932f3863bdeb79c5a9955a0 -size 27789 diff --git a/checkpoint-5100/rng_state_13.pth b/checkpoint-5100/rng_state_13.pth deleted file mode 100644 index 4929b2e9b86f0460906db8eed7d1ab0156f238d2..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd706d0aeecfb525da3ab5daa901fe7638c2e7f5d4cee63cd71b6ca026275bdd -size 27789 diff --git a/checkpoint-5100/rng_state_2.pth b/checkpoint-5100/rng_state_2.pth deleted file mode 100644 index 5b6e339102453607790f1d3271c90300e1c20fb0..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a3cc4068be271200f493c6e5933125535d31c00d193a77baaf617e995cb80113 -size 27772 diff --git a/checkpoint-5100/rng_state_3.pth b/checkpoint-5100/rng_state_3.pth deleted file mode 100644 index 3af67e7908ee466fca4f247cb88787d6b60f095a..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:134ec8578ce099215e557b373586d1334dcba1f9bc3678e21e8a11c8293273b5 -size 27772 diff --git a/checkpoint-5100/rng_state_4.pth b/checkpoint-5100/rng_state_4.pth deleted file mode 100644 index 50ab2211005f0a24bf80d1ae93a75ee9073bedec..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2799584e6f3b97fb9250177cae1099c95a1a72f8c924828310d6e9c9f712a0ad -size 27772 diff --git a/checkpoint-5100/rng_state_5.pth b/checkpoint-5100/rng_state_5.pth deleted file mode 100644 index a237a79776db8339b3886a0cb5f1c1eed5125259..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d2d851757976cd5436fb4f7e4f6b90e86fd7eb7fd174ef2f06b786fab4c8b687 -size 27772 diff --git a/checkpoint-5100/rng_state_6.pth b/checkpoint-5100/rng_state_6.pth deleted file mode 100644 index d0dc6ec1565fb3615ece7b1a24b4c7980b69e39c..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0944f297f8c989eaaaa8748e1b4a866de5757e645fa13d826211ad5f9bf81798 -size 27772 diff --git a/checkpoint-5100/rng_state_7.pth b/checkpoint-5100/rng_state_7.pth deleted file mode 100644 index 3e592acb033fabefcc2e4a888058bfe7cff6aa4c..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f4847f06e89ac0c33e93f4108e29bba8a6a11b57185752e5a61d1d159db7176b -size 27772 diff --git a/checkpoint-5100/rng_state_8.pth b/checkpoint-5100/rng_state_8.pth deleted file mode 100644 index 7a5eb449223406d430f62368de0fca1b9ce65536..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:32e20dcbaf8912d2c4ea76cd78324e384e6e3f340b552198fd77b189a7f80400 -size 27772 diff --git a/checkpoint-5100/rng_state_9.pth b/checkpoint-5100/rng_state_9.pth deleted file mode 100644 index 7522bf2d591e25026b8beb76abbbeff66bef52b9..0000000000000000000000000000000000000000 --- a/checkpoint-5100/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6299cbf9ce668897a91d6363b1369a182cddf5e47a03415dbcb196480ea98de3 -size 27772 diff --git a/checkpoint-5100/scheduler.pt b/checkpoint-5100/scheduler.pt deleted file mode 100644 index b0b8abd7dade13ecdfafa417ba979fa207247f37..0000000000000000000000000000000000000000 --- a/checkpoint-5100/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:04c0158b55de3dc26efbfe9fb78f379b4093417c7720f3a9de19f86082d0caf3 -size 627 diff --git a/checkpoint-5100/training_args.bin b/checkpoint-5100/training_args.bin deleted file mode 100644 index 43b519cde185d2521e004dc718270044540f5e9c..0000000000000000000000000000000000000000 --- a/checkpoint-5100/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b5cc18faa1420e425c2fed06bfe2dd967461487c15531bd94429b7a3c0c02a49 -size 4027 diff --git a/checkpoint-5200/adapter_model.bin b/checkpoint-5200/adapter_model.bin deleted file mode 100644 index 4603cec9d970dae967d1fe03601443f982651c54..0000000000000000000000000000000000000000 --- a/checkpoint-5200/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:28c2d0c51dd5ec8f66ff0bbdb8ae6185bd1eca75e6b3b3409367c09446351f5a -size 500897101 diff --git a/checkpoint-5200/adapter_model/adapter_config.json b/checkpoint-5200/adapter_model/adapter_config.json deleted file mode 100644 index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..0000000000000000000000000000000000000000 --- a/checkpoint-5200/adapter_model/adapter_config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "auto_mapping": null, - "base_model_name_or_path": "/workspace/webui/models/TheBloke_Llama-2-13B-fp16", - "bias": "none", - "fan_in_fan_out": null, - "inference_mode": true, - "init_lora_weights": true, - "layers_pattern": null, - "layers_to_transform": null, - "lora_alpha": 16, - "lora_dropout": 0.05, - "modules_to_save": null, - "peft_type": "LORA", - "r": 32, - "revision": null, - "target_modules": [ - "v_proj", - "up_proj", - "k_proj", - "q_proj", - "down_proj", - "gate_proj", - "o_proj" - ], - "task_type": "CAUSAL_LM" -} \ No newline at end of file diff --git a/checkpoint-5200/adapter_model/adapter_model.bin b/checkpoint-5200/adapter_model/adapter_model.bin deleted file mode 100644 index 4603cec9d970dae967d1fe03601443f982651c54..0000000000000000000000000000000000000000 --- a/checkpoint-5200/adapter_model/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:28c2d0c51dd5ec8f66ff0bbdb8ae6185bd1eca75e6b3b3409367c09446351f5a -size 500897101 diff --git a/checkpoint-5200/optimizer.pt b/checkpoint-5200/optimizer.pt deleted file mode 100644 index 3bf258fce44f70ab030011d1d1bc825f78c75fe3..0000000000000000000000000000000000000000 --- a/checkpoint-5200/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:897aecb8fea53f1688ee40f5672ba9bf2f9263d05d96d719af5a024da878838c -size 1001752701 diff --git a/checkpoint-5200/rng_state_0.pth b/checkpoint-5200/rng_state_0.pth deleted file mode 100644 index 06dd14cb71f3b351e9ae50bdb44b62e88cde3b31..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7d3ab65c749e5fc734aff9ca0257ff2b5fbec92bf74548f706dd50a3522d9444 -size 27772 diff --git a/checkpoint-5200/rng_state_1.pth b/checkpoint-5200/rng_state_1.pth deleted file mode 100644 index 8b972a8eb856a661fcd533cae37605b2b2fb95f8..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0ac25dcd9dd77c6157fe871ffedc3311d277b0f3767923cc0debee8decbcac7c -size 27772 diff --git a/checkpoint-5200/rng_state_10.pth b/checkpoint-5200/rng_state_10.pth deleted file mode 100644 index eaf20c8bbef0790aa366c98de761027cb6f3de0a..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e8ef400cc06c347a4b973def87d07c600ccc0901bb7459cbac62d3b61528b1ea -size 27789 diff --git a/checkpoint-5200/rng_state_11.pth b/checkpoint-5200/rng_state_11.pth deleted file mode 100644 index b79a3c538aa7e18f090761946d884b3367298366..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:943fb5b9798db2076d7d142d97ef850652f063b322a6b291b70fd36b2873faee -size 27789 diff --git a/checkpoint-5200/rng_state_12.pth b/checkpoint-5200/rng_state_12.pth deleted file mode 100644 index 9987c8ffddad292a42cdc5894c097ac31c1d47d7..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4ba67e4d875ae627926fabe393d78116d78522c74be3715f12895caeb0451111 -size 27789 diff --git a/checkpoint-5200/rng_state_13.pth b/checkpoint-5200/rng_state_13.pth deleted file mode 100644 index 091de895d16cccb3c6da890b8639bad827edea90..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c1a40cb952561fb635e6a63b2e31f99fe76eb7379d5250b36d6ceae7607d513 -size 27789 diff --git a/checkpoint-5200/rng_state_2.pth b/checkpoint-5200/rng_state_2.pth deleted file mode 100644 index 081a4e852e0f8945fcf0c1bbe401c18bba590a86..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f49dff9815ef5438a07a8ce0274d35913fc7fd66a9c5e39708a3ed2f5a34531d -size 27772 diff --git a/checkpoint-5200/rng_state_3.pth b/checkpoint-5200/rng_state_3.pth deleted file mode 100644 index da61e91972422c74a684f9de7488fed4771a6d30..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d74211b2b26e9e6e27b2c293da7f898aff1fb43b386304ece8902e9e03cf6ea2 -size 27772 diff --git a/checkpoint-5200/rng_state_4.pth b/checkpoint-5200/rng_state_4.pth deleted file mode 100644 index bd87d2b76577161b6b76cdf9be44d998e91a208b..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f5969252b504ae24eacec7e5ddc1b6375bff73d3b276cd991e25169c2101ec3c -size 27772 diff --git a/checkpoint-5200/rng_state_5.pth b/checkpoint-5200/rng_state_5.pth deleted file mode 100644 index dab5412dfe05e034051e75149d46fe7c2e4409e3..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d96767afd301e0dfec9849df22aeb52b119511b35dae4fd79e1b3e8bab29d1b8 -size 27772 diff --git a/checkpoint-5200/rng_state_6.pth b/checkpoint-5200/rng_state_6.pth deleted file mode 100644 index e8d658bdb81092c1bac24484fd73ca8641c50917..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:25bc6e2e8c95bccdcf883e1283d17bb4645e87943be9d87983483a6e0ea62d19 -size 27772 diff --git a/checkpoint-5200/rng_state_7.pth b/checkpoint-5200/rng_state_7.pth deleted file mode 100644 index cef9722d3a1c0ad35789ef056eaa8bbfabe62e88..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:07239f8fab222d643c376b32e823fe2fa4e52c750e68bd07603feed81ab05f92 -size 27772 diff --git a/checkpoint-5200/rng_state_8.pth b/checkpoint-5200/rng_state_8.pth deleted file mode 100644 index 0bc0db080dd211eb9114f10f4d7d5860fcd1251b..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:126ef2192c7378d259ac9b7f6cc0f79e375ae619b07be1f34655a49f1c8090fa -size 27772 diff --git a/checkpoint-5200/rng_state_9.pth b/checkpoint-5200/rng_state_9.pth deleted file mode 100644 index dd196ac0cbfe92f452825a78370a30048b487390..0000000000000000000000000000000000000000 --- a/checkpoint-5200/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c655791adbb1473fdfbba3cd090a95b3182ba0fabeb7693d4b7675966dd0edc -size 27772 diff --git a/checkpoint-5200/scheduler.pt b/checkpoint-5200/scheduler.pt deleted file mode 100644 index 09b47cb01e336327b19380c7da592c19c4199ffc..0000000000000000000000000000000000000000 --- a/checkpoint-5200/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c657cc9c9f16f76f05d9497e2e29beeb126df858e2b635edfaa2b24e78fb2f61 -size 627 diff --git a/checkpoint-5200/training_args.bin b/checkpoint-5200/training_args.bin deleted file mode 100644 index 43b519cde185d2521e004dc718270044540f5e9c..0000000000000000000000000000000000000000 --- a/checkpoint-5200/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b5cc18faa1420e425c2fed06bfe2dd967461487c15531bd94429b7a3c0c02a49 -size 4027 diff --git a/checkpoint-5300/adapter_model.bin b/checkpoint-5300/adapter_model.bin deleted file mode 100644 index 3e8f72f386e2c3fe895fcb01c3f1de5f5fec965a..0000000000000000000000000000000000000000 --- a/checkpoint-5300/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:14ca48bd88a31002dc05f9274bc978bc8b5b8ae3e51470e74ee7bc0bb12284e9 -size 500897101 diff --git a/checkpoint-5300/optimizer.pt b/checkpoint-5300/optimizer.pt deleted file mode 100644 index 5b8133534a2b769e5c5d5403b729c67018470260..0000000000000000000000000000000000000000 --- a/checkpoint-5300/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:869a51ca719bee8b6aab465be97fa4ac5e228c769321c2712f644067ceeca076 -size 1001752701 diff --git a/checkpoint-5300/rng_state_0.pth b/checkpoint-5300/rng_state_0.pth deleted file mode 100644 index 552dc8ef95a545c64426e4c5711d142bd87b7760..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9267467db4bfc0b62f4b2992b98c478568d6b740025cdb5016f4102da1504163 -size 27772 diff --git a/checkpoint-5300/rng_state_1.pth b/checkpoint-5300/rng_state_1.pth deleted file mode 100644 index cf291739827b5154f004a189694861e364b08a68..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ea0db0e586ec1c1e547243b2e02d8b0d760f3d113e51420b567322fb80b86283 -size 27772 diff --git a/checkpoint-5300/rng_state_10.pth b/checkpoint-5300/rng_state_10.pth deleted file mode 100644 index 839a575806286f384bca65e6c6ed4b642fee5af0..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fcfb12512c0be896f0842434c14afaa23ede7d6aadbd83bfd18570859fcdecdd -size 27789 diff --git a/checkpoint-5300/rng_state_11.pth b/checkpoint-5300/rng_state_11.pth deleted file mode 100644 index 494cf039101c4fc79b0f4f48619b309ef5eeca44..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fcd57397386863534e25c2052e0eb5a3986965528e8332bead4e6da6c8a52a60 -size 27789 diff --git a/checkpoint-5300/rng_state_12.pth b/checkpoint-5300/rng_state_12.pth deleted file mode 100644 index d1ab254f55a9249593c17a205b750a8399f6942e..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3b494220b086ab33c457cd9cb3298d5707ae27861e1a1ea15cf7b2846c34edb3 -size 27789 diff --git a/checkpoint-5300/rng_state_13.pth b/checkpoint-5300/rng_state_13.pth deleted file mode 100644 index e7da07b270a41ff605eff193c3c775f63cefdf4b..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:66ddbbc44b73707a46dbe70a821775b9215bfb3188b97867dfd5d788f2c4bd1b -size 27789 diff --git a/checkpoint-5300/rng_state_2.pth b/checkpoint-5300/rng_state_2.pth deleted file mode 100644 index 8b750c8a0158ec37f230d464ed21d7088af86a15..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e09271dc29724c758580e8e6864e76555b7a1dd95ca5d0036f08cdd9f67fbaec -size 27772 diff --git a/checkpoint-5300/rng_state_3.pth b/checkpoint-5300/rng_state_3.pth deleted file mode 100644 index ec433ee7fc69d37df74002cecc5f6319b94e268f..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:65b0c519b8283902066db24d39bebbf0ec0f57d632779c56be9c9d58f7cdb78e -size 27772 diff --git a/checkpoint-5300/rng_state_4.pth b/checkpoint-5300/rng_state_4.pth deleted file mode 100644 index dc27c448e896fad22f68efc178f08e10e7431ab5..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:868a6a26d82f017652ee4b9e21c96ec36ab5f96be4eeedf65e27eda71ff93f25 -size 27772 diff --git a/checkpoint-5300/rng_state_5.pth b/checkpoint-5300/rng_state_5.pth deleted file mode 100644 index fa32e1f6b7712309b3c8943e87f2650e2c5a13cb..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d82c47d40cdc9cbed8bc1b1f8fdcb354fb8b6ac525cfce07fab2d1af5791c195 -size 27772 diff --git a/checkpoint-5300/rng_state_6.pth b/checkpoint-5300/rng_state_6.pth deleted file mode 100644 index 28ae8ef924932d456fd13a2995c8932487990c8e..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64d8ec328ebab19d4fa69241bbb5de66af7b09aa5f0d71d9e37be38a5170d24e -size 27772 diff --git a/checkpoint-5300/rng_state_7.pth b/checkpoint-5300/rng_state_7.pth deleted file mode 100644 index d9ecf5bafb7af425590b22c77078d9409670f728..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cf9d89caef032992b8f5efcdaf7ab987e37e4fb52ec8d47520f814092e1e7ab3 -size 27772 diff --git a/checkpoint-5300/rng_state_8.pth b/checkpoint-5300/rng_state_8.pth deleted file mode 100644 index 34110f26cf1c2d148a91aa260ddf93627bdc3069..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8913ebfea32419c486eaa9895c49a7962a44933cd37f4965710a3560fe737c25 -size 27772 diff --git a/checkpoint-5300/rng_state_9.pth b/checkpoint-5300/rng_state_9.pth deleted file mode 100644 index acee305b8ff2eb6687dabfd9c1220f25aacfff20..0000000000000000000000000000000000000000 --- a/checkpoint-5300/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:685f43d3417ce77333bd61cb9e79c3d6e0421bb659bae8689caafc6c6b0d8752 -size 27772 diff --git a/checkpoint-5300/scheduler.pt b/checkpoint-5300/scheduler.pt deleted file mode 100644 index c25a03466ceea6c5cb534559ebdfa7a51ae48c90..0000000000000000000000000000000000000000 --- a/checkpoint-5300/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0d904fb502ced275ef5e7925781f477f4c89d48daa60e9f45b9339adf1aaa77d -size 627 diff --git a/checkpoint-5000/README.md b/checkpoint-5400/README.md similarity index 100% rename from checkpoint-5000/README.md rename to checkpoint-5400/README.md diff --git a/checkpoint-5300/adapter_config.json b/checkpoint-5400/adapter_config.json similarity index 100% rename from checkpoint-5300/adapter_config.json rename to checkpoint-5400/adapter_config.json diff --git a/checkpoint-5400/adapter_model.bin b/checkpoint-5400/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd156ad5028e919f5cb218fb803514d02505cbc1 --- /dev/null +++ b/checkpoint-5400/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a996a2cd6511d12fe1f6c74e5551595b29964345d9c5913a1440514d20e74909 +size 500897101 diff --git a/checkpoint-5000/adapter_model/README.md b/checkpoint-5400/adapter_model/README.md similarity index 100% rename from checkpoint-5000/adapter_model/README.md rename to checkpoint-5400/adapter_model/README.md diff --git a/checkpoint-5000/adapter_config.json b/checkpoint-5400/adapter_model/adapter_config.json similarity index 100% rename from checkpoint-5000/adapter_config.json rename to checkpoint-5400/adapter_model/adapter_config.json index 2086dcb8a3bcbe9772b1971a2a24239b77070fbb..5b3f45c250ff330299d2364a46de0623dadd2f48 100644 --- a/checkpoint-5000/adapter_config.json +++ b/checkpoint-5400/adapter_model/adapter_config.json @@ -14,12 +14,12 @@ "r": 32, "revision": null, "target_modules": [ - "k_proj", + "q_proj", + "gate_proj", "o_proj", "down_proj", - "gate_proj", + "k_proj", "v_proj", - "q_proj", "up_proj" ], "task_type": "CAUSAL_LM" diff --git a/checkpoint-5400/adapter_model/adapter_model.bin b/checkpoint-5400/adapter_model/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd156ad5028e919f5cb218fb803514d02505cbc1 --- /dev/null +++ b/checkpoint-5400/adapter_model/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a996a2cd6511d12fe1f6c74e5551595b29964345d9c5913a1440514d20e74909 +size 500897101 diff --git a/checkpoint-5400/optimizer.pt b/checkpoint-5400/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7555b0c057bbcb347ed43d17da54abb9e1d8111d --- /dev/null +++ b/checkpoint-5400/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a049c191517e4cc2442d5e383237bf35c7e90159b14ee20f4ef3f1e917c94f7d +size 1001752701 diff --git a/checkpoint-5400/rng_state_0.pth b/checkpoint-5400/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..647a6426e65252cf43935d08344af7babeb064c0 --- /dev/null +++ b/checkpoint-5400/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb5c299ce12f96c89868d521ed520c7ace1a7a288b7b7a826d6e603aeb79a09 +size 27772 diff --git a/checkpoint-5400/rng_state_1.pth b/checkpoint-5400/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9724602cab7fc1a573eb5dfd68d8f25fd3ba9939 --- /dev/null +++ b/checkpoint-5400/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1b9ccab0a7c765a8ccd991c977a9ffc75c10546853ccb44210b37c9347c640 +size 27772 diff --git a/checkpoint-5400/rng_state_10.pth b/checkpoint-5400/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..022296ad01f7119105de863dfecde9f2e14fdc5b --- /dev/null +++ b/checkpoint-5400/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9597f7462f3230a6cbef5e02b36f74b70ccfcdcc850d8c7e131d92db196783 +size 27789 diff --git a/checkpoint-5400/rng_state_11.pth b/checkpoint-5400/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..56f555cbe7b4f5a0bfdd45d1c41592d5b3e9f922 --- /dev/null +++ b/checkpoint-5400/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8af70b0d7c5428460585eb71f0762f807411f8fcb9745d5f3d67da929bebac6 +size 27789 diff --git a/checkpoint-5400/rng_state_12.pth b/checkpoint-5400/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..1be68b3531c92a104382b223bcd2a5e21cdea62b --- /dev/null +++ b/checkpoint-5400/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6923f879a023dad7d6429c5f4ae2372fbd5ee6569ab6149a7cdae5b14fb3c3 +size 27789 diff --git a/checkpoint-5400/rng_state_13.pth b/checkpoint-5400/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..23988612a99f202bd1f90afecb4bb41fb555be99 --- /dev/null +++ b/checkpoint-5400/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5a179975104cf77a9e13a52a805da05b0e24a85d3849b0f5c3e5420f17eea8 +size 27789 diff --git a/checkpoint-5400/rng_state_2.pth b/checkpoint-5400/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..254c5961935c97254ef1f4227805b6f27c4edaea --- /dev/null +++ b/checkpoint-5400/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739e768c2ad37f578b983337dedf3c7558c279d10f81301e90d17df333839571 +size 27772 diff --git a/checkpoint-5400/rng_state_3.pth b/checkpoint-5400/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..03da82bdfdad227d441685f3eaef44508556a1be --- /dev/null +++ b/checkpoint-5400/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef2ea61eeb1cf909c75298fb11154372946533cb23888c32bb3d5dbf8f450be +size 27772 diff --git a/checkpoint-5400/rng_state_4.pth b/checkpoint-5400/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd14e28b48e5f9f2574ee0d75c78927f9119c929 --- /dev/null +++ b/checkpoint-5400/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0df83ddd7c2adb2cfaa37c8e8ef974c3ee5b10b047c9debb55e91b9c6abfa0 +size 27772 diff --git a/checkpoint-5400/rng_state_5.pth b/checkpoint-5400/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..07748b51d97d028c3487f01b56d39221b95d1fd8 --- /dev/null +++ b/checkpoint-5400/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d8090af65c1044a84f75fca5aaad6150338b890ba2ff8a597eb42e98730156 +size 27772 diff --git a/checkpoint-5400/rng_state_6.pth b/checkpoint-5400/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..7f8ad871dcef65ddc3c6d6c74943d5af367e93da --- /dev/null +++ b/checkpoint-5400/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39eb6a8461a3f8f64867ca24431f39e0c189f967e51fc06b1cd04b61557b7ab5 +size 27772 diff --git a/checkpoint-5400/rng_state_7.pth b/checkpoint-5400/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ca23cfac756660d83bdfb1aba90ee48188b0f64 --- /dev/null +++ b/checkpoint-5400/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c082109f0ab8381e4f9518c09cb1c66ba874df40524ab79671e907b2bae40124 +size 27772 diff --git a/checkpoint-5400/rng_state_8.pth b/checkpoint-5400/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0f7361e8b7974957dfa1528f4444566f026e19c --- /dev/null +++ b/checkpoint-5400/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09522662a1c7e523f238f6591ac23db965da78361158348b4370a4a0e5cadc9 +size 27772 diff --git a/checkpoint-5400/rng_state_9.pth b/checkpoint-5400/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..58b1b613012a8d080ec41d7e4c15bd56c5c5cec8 --- /dev/null +++ b/checkpoint-5400/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b144a36861671d0f406faba8754207d253d86202309d2a0cf2f6675277d4179 +size 27772 diff --git a/checkpoint-5400/scheduler.pt b/checkpoint-5400/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1be0e334dd83be886ca4f8fac072c80978e3367 --- /dev/null +++ b/checkpoint-5400/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced8c2de33809dd534295dd5742d2284a2f142b85e0e85a7f49385eb1bef7354 +size 627 diff --git a/checkpoint-5300/trainer_state.json b/checkpoint-5400/trainer_state.json similarity index 97% rename from checkpoint-5300/trainer_state.json rename to checkpoint-5400/trainer_state.json index 119d10f474474ee53860d56031071f00f9c5117c..2189af52f6e9c44add63f68f896d86aa0f21830e 100644 --- a/checkpoint-5300/trainer_state.json +++ b/checkpoint-5400/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 2.055060100814269, - "global_step": 5300, + "epoch": 2.093834819697557, + "global_step": 5400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1294,11 +1294,35 @@ "learning_rate": 4.519953408196152e-05, "loss": 0.7424, "step": 5300 + }, + { + "epoch": 2.06, + "learning_rate": 4.435215802306635e-05, + "loss": 0.7521, + "step": 5325 + }, + { + "epoch": 2.07, + "learning_rate": 4.351053109942894e-05, + "loss": 0.7477, + "step": 5350 + }, + { + "epoch": 2.08, + "learning_rate": 4.2674740261896776e-05, + "loss": 0.7456, + "step": 5375 + }, + { + "epoch": 2.09, + "learning_rate": 4.1844871858374844e-05, + "loss": 0.766, + "step": 5400 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.282482987033428e+19, + "total_flos": 2.325582880769573e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-5300/training_args.bin b/checkpoint-5400/training_args.bin similarity index 100% rename from checkpoint-5300/training_args.bin rename to checkpoint-5400/training_args.bin diff --git a/checkpoint-5100/README.md b/checkpoint-5500/README.md similarity index 100% rename from checkpoint-5100/README.md rename to checkpoint-5500/README.md diff --git a/checkpoint-5000/adapter_model/adapter_config.json b/checkpoint-5500/adapter_config.json similarity index 100% rename from checkpoint-5000/adapter_model/adapter_config.json rename to checkpoint-5500/adapter_config.json index 2086dcb8a3bcbe9772b1971a2a24239b77070fbb..5b3f45c250ff330299d2364a46de0623dadd2f48 100644 --- a/checkpoint-5000/adapter_model/adapter_config.json +++ b/checkpoint-5500/adapter_config.json @@ -14,12 +14,12 @@ "r": 32, "revision": null, "target_modules": [ - "k_proj", + "q_proj", + "gate_proj", "o_proj", "down_proj", - "gate_proj", + "k_proj", "v_proj", - "q_proj", "up_proj" ], "task_type": "CAUSAL_LM" diff --git a/checkpoint-5500/adapter_model.bin b/checkpoint-5500/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f25b271253aa1d3a3bd632c7016f808689db2a29 --- /dev/null +++ b/checkpoint-5500/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7243d5bc7b28d5d5a4bafb40fe933dd1f5d2b41c4b35311c4562dd50c5883a +size 500897101 diff --git a/checkpoint-5100/adapter_model/README.md b/checkpoint-5500/adapter_model/README.md similarity index 100% rename from checkpoint-5100/adapter_model/README.md rename to checkpoint-5500/adapter_model/README.md diff --git a/checkpoint-5100/adapter_config.json b/checkpoint-5500/adapter_model/adapter_config.json similarity index 94% rename from checkpoint-5100/adapter_config.json rename to checkpoint-5500/adapter_model/adapter_config.json index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..5b3f45c250ff330299d2364a46de0623dadd2f48 100644 --- a/checkpoint-5100/adapter_config.json +++ b/checkpoint-5500/adapter_model/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "v_proj", - "up_proj", - "k_proj", "q_proj", - "down_proj", "gate_proj", - "o_proj" + "o_proj", + "down_proj", + "k_proj", + "v_proj", + "up_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-5500/adapter_model/adapter_model.bin b/checkpoint-5500/adapter_model/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f25b271253aa1d3a3bd632c7016f808689db2a29 --- /dev/null +++ b/checkpoint-5500/adapter_model/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7243d5bc7b28d5d5a4bafb40fe933dd1f5d2b41c4b35311c4562dd50c5883a +size 500897101 diff --git a/checkpoint-5500/optimizer.pt b/checkpoint-5500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..9de25741384aed487c7fd491f6d7000ab7391a28 --- /dev/null +++ b/checkpoint-5500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80adf9c30a8a3ebab96b13b5000ed1b3eb4306228d36a12dfadc4e7cc433a4ec +size 1001752701 diff --git a/checkpoint-5500/rng_state_0.pth b/checkpoint-5500/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..375583ee0114caccc2517feebcce2c8d1c5bbef2 --- /dev/null +++ b/checkpoint-5500/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30e0a79fb2da13095943ed5d6ff4010e829f95de5b910b4f831e610487314e6f +size 27772 diff --git a/checkpoint-5500/rng_state_1.pth b/checkpoint-5500/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..54a3655e3b78b20585701028c092f2637fd2ce00 --- /dev/null +++ b/checkpoint-5500/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5459f0eefaad357478856f70446e39da7b343e17571839caaa8a02c194f7d669 +size 27772 diff --git a/checkpoint-5500/rng_state_10.pth b/checkpoint-5500/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..75a9f4a9e9fd3a7a62591d00ff06be84e71aea34 --- /dev/null +++ b/checkpoint-5500/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386be381ea58870ea29c419ee56fe49473c2a98987edeacf220a45b1a2223941 +size 27789 diff --git a/checkpoint-5500/rng_state_11.pth b/checkpoint-5500/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..b586bcfc5015187309aa7af69f45cbb254144307 --- /dev/null +++ b/checkpoint-5500/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e40b2e53f6a7d00bfd79e9648b446e522e5f1b008a72d0ecf49f8afaa037c8 +size 27789 diff --git a/checkpoint-5500/rng_state_12.pth b/checkpoint-5500/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..c29c388f13f32dae9c32e4c071fda464405a9322 --- /dev/null +++ b/checkpoint-5500/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800d188559c734beb02115217b063e8bb6cb7259475ac5e72045222c4e97d3ae +size 27789 diff --git a/checkpoint-5500/rng_state_13.pth b/checkpoint-5500/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ba5ed295cf29346055bdd5cf0eafe42825ef71a --- /dev/null +++ b/checkpoint-5500/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675b5fc0a7deb4335cae143f3a24d62ea65052ce52feb5d15793418be4662ac8 +size 27789 diff --git a/checkpoint-5500/rng_state_2.pth b/checkpoint-5500/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4680c515e6a46cff17f2e62d732fb07f95ab77ba --- /dev/null +++ b/checkpoint-5500/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6acf616edcf44f8c9ecee1675d30b9f4f2d2de918203c9ebb49e8a44b17d57c +size 27772 diff --git a/checkpoint-5500/rng_state_3.pth b/checkpoint-5500/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..64ec2a11029a7441175ee5542c99c46dc5619f04 --- /dev/null +++ b/checkpoint-5500/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a7c589905769b0dbc43278783063253c4361403cb5e93a12c744d0c001f090 +size 27772 diff --git a/checkpoint-5500/rng_state_4.pth b/checkpoint-5500/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..5227670a97240c57e138f4d60872d572b75fc996 --- /dev/null +++ b/checkpoint-5500/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eca9eeb1ff3b7857657d5e2e3990c3de3e6f2dc13c394c9ae206a0dc471b87a +size 27772 diff --git a/checkpoint-5500/rng_state_5.pth b/checkpoint-5500/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..8a33ed4598f2324bbe058926b7491927b7b77932 --- /dev/null +++ b/checkpoint-5500/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17e2394c1de98b9b25d7d58415327217900745e09f7ab9276a36f8c4ea50f4f +size 27772 diff --git a/checkpoint-5500/rng_state_6.pth b/checkpoint-5500/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca5795980d78ac96cd5daf1bdf5c0858e8b2a832 --- /dev/null +++ b/checkpoint-5500/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1131467c982915441e4d4625565d4d9601fd3f17521d48e909b1e53bfaff94c +size 27772 diff --git a/checkpoint-5500/rng_state_7.pth b/checkpoint-5500/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb891e32df8c55a1398132e80f30d6e272792afb --- /dev/null +++ b/checkpoint-5500/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293b86ebb5ed10caa66ef5329f9bec84416b4637fe61389a51d73c4026771d2c +size 27772 diff --git a/checkpoint-5500/rng_state_8.pth b/checkpoint-5500/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..acd4ffee7fb61ee99058b6beda1331dcd5f97e75 --- /dev/null +++ b/checkpoint-5500/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686f925d57ef5c5206a88fc40e5fc96231e3bf44a2a0b7213509ab2181ee4b8f +size 27772 diff --git a/checkpoint-5500/rng_state_9.pth b/checkpoint-5500/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..078b89d1d2eb8b5500cfe358a93cf0ab5b560d5c --- /dev/null +++ b/checkpoint-5500/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f2aba6953f527967beec2652c8b9c0bb338e770c0158e5e0f3e5100d0f7bc63 +size 27772 diff --git a/checkpoint-5500/scheduler.pt b/checkpoint-5500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a13f5f4b1c314e1988588849c40d157694f99e3a --- /dev/null +++ b/checkpoint-5500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceeb3b5fc20812592b97207e07386031eb6265ebb23202022487dfc5a6412586 +size 627 diff --git a/checkpoint-5200/trainer_state.json b/checkpoint-5500/trainer_state.json similarity index 94% rename from checkpoint-5200/trainer_state.json rename to checkpoint-5500/trainer_state.json index 97b3abd665702c8773f0ea57e83d10c932db6f9d..e329e3c79569c013bed16a6058c7908dcf40a6a7 100644 --- a/checkpoint-5200/trainer_state.json +++ b/checkpoint-5500/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 2.016285381930981, - "global_step": 5200, + "epoch": 2.1326095385808452, + "global_step": 5500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1270,11 +1270,83 @@ "learning_rate": 4.864477005494938e-05, "loss": 0.7654, "step": 5200 + }, + { + "epoch": 2.03, + "learning_rate": 4.777527870665592e-05, + "loss": 0.7468, + "step": 5225 + }, + { + "epoch": 2.04, + "learning_rate": 4.691118284138296e-05, + "loss": 0.7359, + "step": 5250 + }, + { + "epoch": 2.05, + "learning_rate": 4.605257173130763e-05, + "loss": 0.7422, + "step": 5275 + }, + { + "epoch": 2.06, + "learning_rate": 4.519953408196152e-05, + "loss": 0.7424, + "step": 5300 + }, + { + "epoch": 2.06, + "learning_rate": 4.435215802306635e-05, + "loss": 0.7521, + "step": 5325 + }, + { + "epoch": 2.07, + "learning_rate": 4.351053109942894e-05, + "loss": 0.7477, + "step": 5350 + }, + { + "epoch": 2.08, + "learning_rate": 4.2674740261896776e-05, + "loss": 0.7456, + "step": 5375 + }, + { + "epoch": 2.09, + "learning_rate": 4.1844871858374844e-05, + "loss": 0.766, + "step": 5400 + }, + { + "epoch": 2.1, + "learning_rate": 4.1021011624904814e-05, + "loss": 0.7664, + "step": 5425 + }, + { + "epoch": 2.11, + "learning_rate": 4.0203244676807353e-05, + "loss": 0.7703, + "step": 5450 + }, + { + "epoch": 2.12, + "learning_rate": 3.939165549988873e-05, + "loss": 0.7674, + "step": 5475 + }, + { + "epoch": 2.13, + "learning_rate": 3.858632794171222e-05, + "loss": 0.7722, + "step": 5500 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.2394545727200035e+19, + "total_flos": 2.3687017848899633e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-5500/training_args.bin b/checkpoint-5500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1 --- /dev/null +++ b/checkpoint-5500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6 +size 4027 diff --git a/checkpoint-5200/README.md b/checkpoint-5600/README.md similarity index 100% rename from checkpoint-5200/README.md rename to checkpoint-5600/README.md diff --git a/checkpoint-5100/adapter_model/adapter_config.json b/checkpoint-5600/adapter_config.json similarity index 94% rename from checkpoint-5100/adapter_model/adapter_config.json rename to checkpoint-5600/adapter_config.json index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..5b3f45c250ff330299d2364a46de0623dadd2f48 100644 --- a/checkpoint-5100/adapter_model/adapter_config.json +++ b/checkpoint-5600/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "v_proj", - "up_proj", - "k_proj", "q_proj", - "down_proj", "gate_proj", - "o_proj" + "o_proj", + "down_proj", + "k_proj", + "v_proj", + "up_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-5600/adapter_model.bin b/checkpoint-5600/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..427abc5179a9c1573bde250175a84acdb13acb5a --- /dev/null +++ b/checkpoint-5600/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96ff867e21cc9653b08a6604c2b9fee34b49567f39bc3b5219920c59a1ad479 +size 500897101 diff --git a/checkpoint-5200/adapter_model/README.md b/checkpoint-5600/adapter_model/README.md similarity index 100% rename from checkpoint-5200/adapter_model/README.md rename to checkpoint-5600/adapter_model/README.md diff --git a/checkpoint-5600/adapter_model/adapter_config.json b/checkpoint-5600/adapter_model/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b3f45c250ff330299d2364a46de0623dadd2f48 --- /dev/null +++ b/checkpoint-5600/adapter_model/adapter_config.json @@ -0,0 +1,26 @@ +{ + "auto_mapping": null, + "base_model_name_or_path": "/workspace/webui/models/TheBloke_Llama-2-13B-fp16", + "bias": "none", + "fan_in_fan_out": null, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 16, + "lora_dropout": 0.05, + "modules_to_save": null, + "peft_type": "LORA", + "r": 32, + "revision": null, + "target_modules": [ + "q_proj", + "gate_proj", + "o_proj", + "down_proj", + "k_proj", + "v_proj", + "up_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-5600/adapter_model/adapter_model.bin b/checkpoint-5600/adapter_model/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..427abc5179a9c1573bde250175a84acdb13acb5a --- /dev/null +++ b/checkpoint-5600/adapter_model/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96ff867e21cc9653b08a6604c2b9fee34b49567f39bc3b5219920c59a1ad479 +size 500897101 diff --git a/checkpoint-5600/optimizer.pt b/checkpoint-5600/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0fbdf4d0a53fbf8f9394431ee4fb0d3982604ec --- /dev/null +++ b/checkpoint-5600/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df47db77572b5903eee04a46dab5d058c91d6beb23a0c788c4e7a5ff96c06106 +size 1001752701 diff --git a/checkpoint-5600/rng_state_0.pth b/checkpoint-5600/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..400f0b99223b4a2b6ff573b6179ecd47f631f0ab --- /dev/null +++ b/checkpoint-5600/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2649527449cc7bab876f24864f3a04b696ce2041881461ec304e8e720f5c2731 +size 27772 diff --git a/checkpoint-5600/rng_state_1.pth b/checkpoint-5600/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2be91acf27fb464aec769cdf1ae4ca2e704c738a --- /dev/null +++ b/checkpoint-5600/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae037bf942f3d5243bbe7c3db837eb84dcd51095ec0ba382f43a17d0c0c87f5b +size 27772 diff --git a/checkpoint-5600/rng_state_10.pth b/checkpoint-5600/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..e59ba6d28072b1c441e071b56698aac69fed5117 --- /dev/null +++ b/checkpoint-5600/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d09be680de783308c5b6c5c5c75f1cf1b7e91ec7dbf0ccc24e0e1adea4c8acd +size 27789 diff --git a/checkpoint-5600/rng_state_11.pth b/checkpoint-5600/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..9de92cb383dcef1347b179fe9b8d5ec38ee15c3e --- /dev/null +++ b/checkpoint-5600/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72fe3e4408208255a5fc68fcce1f01d10c7f1eae3f2c7548666160ee70f0e6aa +size 27789 diff --git a/checkpoint-5600/rng_state_12.pth b/checkpoint-5600/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c5dfd7ae4a944d2633a0f570b01b0eb9cbda76e --- /dev/null +++ b/checkpoint-5600/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0960c791386b2315bfdb5dc6eb00805451f82b5884e14fa0e8b5f9e824859ff +size 27789 diff --git a/checkpoint-5600/rng_state_13.pth b/checkpoint-5600/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..7691410b7970e8c4b5c94ebe8b13e01319206818 --- /dev/null +++ b/checkpoint-5600/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:732bbec507cf39b6e24310e2184b2d9b1837e907f6677563fd5c6f9891d7a8de +size 27789 diff --git a/checkpoint-5600/rng_state_2.pth b/checkpoint-5600/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d392ab1a2e830ddde436953957e80c79a7077ed --- /dev/null +++ b/checkpoint-5600/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce44f1432aaa2d64261a1f7fbc6a5482030d9f8a9fffc628a7cdebce9ee27a6 +size 27772 diff --git a/checkpoint-5600/rng_state_3.pth b/checkpoint-5600/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ead0be94ffa333db9e7905e81a8fa62d2bad5d69 --- /dev/null +++ b/checkpoint-5600/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c025a89c9d90fd82a35542e443baf062744f6456e92fe3bcf602fa5825c4f3e +size 27772 diff --git a/checkpoint-5600/rng_state_4.pth b/checkpoint-5600/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..78f05a6a3410eb5c9db1d7e3137a8e56044e95b9 --- /dev/null +++ b/checkpoint-5600/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a516cb688f1dc31792fb91446d23ded3a5796e4dc99dd525d9bac5f9dc529c35 +size 27772 diff --git a/checkpoint-5600/rng_state_5.pth b/checkpoint-5600/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..76f3854f263fe2c261868a0160dd999cb2499026 --- /dev/null +++ b/checkpoint-5600/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7823690621e69b2981b133b63eb5a80a23490616d48dc63cb760e86e38604a +size 27772 diff --git a/checkpoint-5600/rng_state_6.pth b/checkpoint-5600/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b5aaf73005a165301ae66b9dc4272d38c4ec85b --- /dev/null +++ b/checkpoint-5600/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18df96fd55552e3861ed458fc798b0c3920f65c1ce37c6cc620c9e50505a7e09 +size 27772 diff --git a/checkpoint-5600/rng_state_7.pth b/checkpoint-5600/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..19412ea18371d748e653a42aba6abeaedfa8bbc1 --- /dev/null +++ b/checkpoint-5600/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f81d3438f9d778b8103678ab771741f7b2225c3019a7cfc2e9c229006c5413 +size 27772 diff --git a/checkpoint-5600/rng_state_8.pth b/checkpoint-5600/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..83f0aaf0a98801f5e36eaaf7c376c438f1e7f02b --- /dev/null +++ b/checkpoint-5600/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5b70e93fcc996c03cc042b239463bcc53073b6d9ed06b24e1269d510cb89df +size 27772 diff --git a/checkpoint-5600/rng_state_9.pth b/checkpoint-5600/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..0b891a65ce49471ffa81bef6f5673197f206205c --- /dev/null +++ b/checkpoint-5600/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90f3084f765b30672ebf421b021b4022b5f3d36076be9073a91796e1a6089b1 +size 27772 diff --git a/checkpoint-5600/scheduler.pt b/checkpoint-5600/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd78806480121e3ea9f28152ce36ad0e0f05faa --- /dev/null +++ b/checkpoint-5600/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b513b0465d40001c6314a5a4b4dc290c6baefd28e2877ca89d7e28757ae1791 +size 627 diff --git a/checkpoint-5100/trainer_state.json b/checkpoint-5600/trainer_state.json similarity index 91% rename from checkpoint-5100/trainer_state.json rename to checkpoint-5600/trainer_state.json index 31f9ead56164f53bb88ae75076a62bb58974bed0..0f4cbe52d86850b9d7cc6d7dd5bb106474d0cae3 100644 --- a/checkpoint-5100/trainer_state.json +++ b/checkpoint-5600/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 1.9775106630476929, - "global_step": 5100, + "epoch": 2.1713842574641333, + "global_step": 5600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1246,11 +1246,131 @@ "learning_rate": 5.21748855202839e-05, "loss": 0.7868, "step": 5100 + }, + { + "epoch": 1.99, + "learning_rate": 5.128471597058342e-05, + "loss": 0.7993, + "step": 5125 + }, + { + "epoch": 2.0, + "learning_rate": 5.03995793340572e-05, + "loss": 0.7892, + "step": 5150 + }, + { + "epoch": 2.01, + "learning_rate": 4.9519567056663694e-05, + "loss": 0.7788, + "step": 5175 + }, + { + "epoch": 2.02, + "learning_rate": 4.864477005494938e-05, + "loss": 0.7654, + "step": 5200 + }, + { + "epoch": 2.03, + "learning_rate": 4.777527870665592e-05, + "loss": 0.7468, + "step": 5225 + }, + { + "epoch": 2.04, + "learning_rate": 4.691118284138296e-05, + "loss": 0.7359, + "step": 5250 + }, + { + "epoch": 2.05, + "learning_rate": 4.605257173130763e-05, + "loss": 0.7422, + "step": 5275 + }, + { + "epoch": 2.06, + "learning_rate": 4.519953408196152e-05, + "loss": 0.7424, + "step": 5300 + }, + { + "epoch": 2.06, + "learning_rate": 4.435215802306635e-05, + "loss": 0.7521, + "step": 5325 + }, + { + "epoch": 2.07, + "learning_rate": 4.351053109942894e-05, + "loss": 0.7477, + "step": 5350 + }, + { + "epoch": 2.08, + "learning_rate": 4.2674740261896776e-05, + "loss": 0.7456, + "step": 5375 + }, + { + "epoch": 2.09, + "learning_rate": 4.1844871858374844e-05, + "loss": 0.766, + "step": 5400 + }, + { + "epoch": 2.1, + "learning_rate": 4.1021011624904814e-05, + "loss": 0.7664, + "step": 5425 + }, + { + "epoch": 2.11, + "learning_rate": 4.0203244676807353e-05, + "loss": 0.7703, + "step": 5450 + }, + { + "epoch": 2.12, + "learning_rate": 3.939165549988873e-05, + "loss": 0.7674, + "step": 5475 + }, + { + "epoch": 2.13, + "learning_rate": 3.858632794171222e-05, + "loss": 0.7722, + "step": 5500 + }, + { + "epoch": 2.14, + "learning_rate": 3.778734520293562e-05, + "loss": 0.7716, + "step": 5525 + }, + { + "epoch": 2.15, + "learning_rate": 3.699478982871561e-05, + "loss": 0.7795, + "step": 5550 + }, + { + "epoch": 2.16, + "learning_rate": 3.62087437001797e-05, + "loss": 0.7728, + "step": 5575 + }, + { + "epoch": 2.17, + "learning_rate": 3.5429288025966944e-05, + "loss": 0.7709, + "step": 5600 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.1963895120276226e+19, + "total_flos": 2.4117470741298938e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-5600/training_args.bin b/checkpoint-5600/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1 --- /dev/null +++ b/checkpoint-5600/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6 +size 4027 diff --git a/checkpoint-5300/README.md b/checkpoint-5700/README.md similarity index 100% rename from checkpoint-5300/README.md rename to checkpoint-5700/README.md diff --git a/checkpoint-5200/adapter_config.json b/checkpoint-5700/adapter_config.json similarity index 94% rename from checkpoint-5200/adapter_config.json rename to checkpoint-5700/adapter_config.json index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..7052646debaf453de93d6176727714122c31b64a 100644 --- a/checkpoint-5200/adapter_config.json +++ b/checkpoint-5700/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ + "q_proj", "v_proj", + "gate_proj", "up_proj", + "o_proj", "k_proj", - "q_proj", - "down_proj", - "gate_proj", - "o_proj" + "down_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-5700/adapter_model.bin b/checkpoint-5700/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..02526e93c7101a3c9d0727acfe024831696398f1 --- /dev/null +++ b/checkpoint-5700/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95 +size 500897101 diff --git a/checkpoint-5700/optimizer.pt b/checkpoint-5700/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3c8aee3e9ab00a5c3caededd68fa2b6406534b --- /dev/null +++ b/checkpoint-5700/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8847b7875d322ad5570a300587a0f3924a360ae4df3e2feeb97a8a2e21a3cbff +size 1001752701 diff --git a/checkpoint-5700/rng_state_0.pth b/checkpoint-5700/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c2a9137bfd1f9c3efd5228cb92aa36dc82cc29a --- /dev/null +++ b/checkpoint-5700/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06ce8fd6a33ec4407e0888bbcc8c7e40f4d820c9b7b7024f808c1cb08bac1f9 +size 27772 diff --git a/checkpoint-5700/rng_state_1.pth b/checkpoint-5700/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..07bb8ba3171f9114ca378631f850b16a8ca02a83 --- /dev/null +++ b/checkpoint-5700/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218ef7d643b85f18451d0ff4e11963ac2483f153fb71cc3ca1ab2bc1c0c67051 +size 27772 diff --git a/checkpoint-5700/rng_state_10.pth b/checkpoint-5700/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..62f27578ae3c5f05071b9cf5c702eeb81bc6d415 --- /dev/null +++ b/checkpoint-5700/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d52fed50c25d75d7fa962b9f10f71f848700ff11f9305a37b16ca126fee5481 +size 27789 diff --git a/checkpoint-5700/rng_state_11.pth b/checkpoint-5700/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2efdd8e880e555c19f213e77989c03985c1fd8a --- /dev/null +++ b/checkpoint-5700/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4cdcdc956f43b62d0d18dc1d662748eb79bf6714c90145fc90101a1ea2249d +size 27789 diff --git a/checkpoint-5700/rng_state_12.pth b/checkpoint-5700/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..35ffc9df08e4edd6abf3d1d242d2d90918445da0 --- /dev/null +++ b/checkpoint-5700/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8305db4caf39e6fd5e1f06f849d2a6d65681cf5c367dd8a754a886f1d32d4456 +size 27789 diff --git a/checkpoint-5700/rng_state_13.pth b/checkpoint-5700/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..9951d89ea973b30e68cd7319d1009ce908729213 --- /dev/null +++ b/checkpoint-5700/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9d3dc3cf0abd594c579dd75cbe79170df6d02cec6c38d47e042b3dd26300d9 +size 27789 diff --git a/checkpoint-5700/rng_state_2.pth b/checkpoint-5700/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d36198d13637177c88509187eec27963707dbc4 --- /dev/null +++ b/checkpoint-5700/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348612a8cf3a488b2de324430f631e10c4e8156112e6c50cecda44157e829595 +size 27772 diff --git a/checkpoint-5700/rng_state_3.pth b/checkpoint-5700/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f72210cf61d845505e06c0f681a11f782d2d543 --- /dev/null +++ b/checkpoint-5700/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c688a5f058c380a72ea06519f8b004106c3bf62f4ac8ae5b0e96c473dbac963c +size 27772 diff --git a/checkpoint-5700/rng_state_4.pth b/checkpoint-5700/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..062d0bace80c1db35317fbd29fd2698c02cb8cd8 --- /dev/null +++ b/checkpoint-5700/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ebd3abf1496a95cb8a1cc494c974137f7880bb1069b7813817b8600444464d +size 27772 diff --git a/checkpoint-5700/rng_state_5.pth b/checkpoint-5700/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..337c9b58db07231bee27e8d458d57f2f970e7da4 --- /dev/null +++ b/checkpoint-5700/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ad3339005efdbfae3bb272ea3ce0907371f54b4834a96fa9c864807063f63d +size 27772 diff --git a/checkpoint-5700/rng_state_6.pth b/checkpoint-5700/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6b7bdf4e47fc358d7c2daa8c1e04e4eae152289 --- /dev/null +++ b/checkpoint-5700/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f13556a5091d1d8f3874fe4a97ac3fc222b586812ceab6167e99bc25dc28fc0 +size 27772 diff --git a/checkpoint-5700/rng_state_7.pth b/checkpoint-5700/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2beb3e1bd8f4fe6a018c96e8cc80233ad1384b9 --- /dev/null +++ b/checkpoint-5700/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b76a223c2ea9e5262b69fc056b9f29e0dd62a728f58a99ac77374aeb72fce68 +size 27772 diff --git a/checkpoint-5700/rng_state_8.pth b/checkpoint-5700/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..73e55c77fc49eb5929193d73402cd3d20c1f563e --- /dev/null +++ b/checkpoint-5700/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae0f14b82c516564368a80f0d993ef826bf389434bdd326ac982efc3e52dc286 +size 27772 diff --git a/checkpoint-5700/rng_state_9.pth b/checkpoint-5700/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7da4b43531a42c31650b4c283559a7d8f311a95 --- /dev/null +++ b/checkpoint-5700/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff589c2de9aa0e8b005f5e548e65245c51b773411b16d01c505e9d491673af3f +size 27772 diff --git a/checkpoint-5700/scheduler.pt b/checkpoint-5700/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e36ca6a96764eeccb6aa7d9c5028585fed23370 --- /dev/null +++ b/checkpoint-5700/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:935f0139e1e2ffb90e75a6a1904fe50b37854f0d00a6d9b7dc07c85fc7a0d97c +size 627 diff --git a/checkpoint-5000/trainer_state.json b/checkpoint-5700/trainer_state.json similarity index 87% rename from checkpoint-5000/trainer_state.json rename to checkpoint-5700/trainer_state.json index af780eb13311ced739f9badd8713c039b76bfa10..8c4091dad201566e2ffa5b495ce638f306686a5e 100644 --- a/checkpoint-5000/trainer_state.json +++ b/checkpoint-5700/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 1.9387359441644048, - "global_step": 5000, + "epoch": 2.2101589763474214, + "global_step": 5700, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1222,11 +1222,179 @@ "eval_samples_per_second": 12.251, "eval_steps_per_second": 0.889, "step": 5000 + }, + { + "epoch": 1.95, + "learning_rate": 5.487466944644033e-05, + "loss": 0.7902, + "step": 5025 + }, + { + "epoch": 1.96, + "learning_rate": 5.3969954985052996e-05, + "loss": 0.7979, + "step": 5050 + }, + { + "epoch": 1.97, + "learning_rate": 5.306999601723579e-05, + "loss": 0.7931, + "step": 5075 + }, + { + "epoch": 1.98, + "learning_rate": 5.21748855202839e-05, + "loss": 0.7868, + "step": 5100 + }, + { + "epoch": 1.99, + "learning_rate": 5.128471597058342e-05, + "loss": 0.7993, + "step": 5125 + }, + { + "epoch": 2.0, + "learning_rate": 5.03995793340572e-05, + "loss": 0.7892, + "step": 5150 + }, + { + "epoch": 2.01, + "learning_rate": 4.9519567056663694e-05, + "loss": 0.7788, + "step": 5175 + }, + { + "epoch": 2.02, + "learning_rate": 4.864477005494938e-05, + "loss": 0.7654, + "step": 5200 + }, + { + "epoch": 2.03, + "learning_rate": 4.777527870665592e-05, + "loss": 0.7468, + "step": 5225 + }, + { + "epoch": 2.04, + "learning_rate": 4.691118284138296e-05, + "loss": 0.7359, + "step": 5250 + }, + { + "epoch": 2.05, + "learning_rate": 4.605257173130763e-05, + "loss": 0.7422, + "step": 5275 + }, + { + "epoch": 2.06, + "learning_rate": 4.519953408196152e-05, + "loss": 0.7424, + "step": 5300 + }, + { + "epoch": 2.06, + "learning_rate": 4.435215802306635e-05, + "loss": 0.7521, + "step": 5325 + }, + { + "epoch": 2.07, + "learning_rate": 4.351053109942894e-05, + "loss": 0.7477, + "step": 5350 + }, + { + "epoch": 2.08, + "learning_rate": 4.2674740261896776e-05, + "loss": 0.7456, + "step": 5375 + }, + { + "epoch": 2.09, + "learning_rate": 4.1844871858374844e-05, + "loss": 0.766, + "step": 5400 + }, + { + "epoch": 2.1, + "learning_rate": 4.1021011624904814e-05, + "loss": 0.7664, + "step": 5425 + }, + { + "epoch": 2.11, + "learning_rate": 4.0203244676807353e-05, + "loss": 0.7703, + "step": 5450 + }, + { + "epoch": 2.12, + "learning_rate": 3.939165549988873e-05, + "loss": 0.7674, + "step": 5475 + }, + { + "epoch": 2.13, + "learning_rate": 3.858632794171222e-05, + "loss": 0.7722, + "step": 5500 + }, + { + "epoch": 2.14, + "learning_rate": 3.778734520293562e-05, + "loss": 0.7716, + "step": 5525 + }, + { + "epoch": 2.15, + "learning_rate": 3.699478982871561e-05, + "loss": 0.7795, + "step": 5550 + }, + { + "epoch": 2.16, + "learning_rate": 3.62087437001797e-05, + "loss": 0.7728, + "step": 5575 + }, + { + "epoch": 2.17, + "learning_rate": 3.5429288025966944e-05, + "loss": 0.7709, + "step": 5600 + }, + { + "epoch": 2.18, + "learning_rate": 3.4656503333837956e-05, + "loss": 0.7682, + "step": 5625 + }, + { + "epoch": 2.19, + "learning_rate": 3.389046946235542e-05, + "loss": 0.7734, + "step": 5650 + }, + { + "epoch": 2.2, + "learning_rate": 3.313126555263576e-05, + "loss": 0.7716, + "step": 5675 + }, + { + "epoch": 2.21, + "learning_rate": 3.237897004017276e-05, + "loss": 0.7716, + "step": 5700 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.1532695573582316e+19, + "total_flos": 2.4549667828507083e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-5700/training_args.bin b/checkpoint-5700/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..c456116f688fe6cb6deecb1e0a1cf8d153d349fb --- /dev/null +++ b/checkpoint-5700/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2 +size 4027 diff --git a/training_args.bin b/training_args.bin index ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1..c456116f688fe6cb6deecb1e0a1cf8d153d349fb 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6 +oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2 size 4027