diff --git a/adapter_config.json b/adapter_config.json
index 5b3f45c250ff330299d2364a46de0623dadd2f48..7052646debaf453de93d6176727714122c31b64a 100644
--- a/adapter_config.json
+++ b/adapter_config.json
@@ -15,12 +15,12 @@
   "revision": null,
   "target_modules": [
     "q_proj",
+    "v_proj",
     "gate_proj",
+    "up_proj",
     "o_proj",
-    "down_proj",
     "k_proj",
-    "v_proj",
-    "up_proj"
+    "down_proj"
   ],
   "task_type": "CAUSAL_LM"
 }
\ No newline at end of file
diff --git a/adapter_model.bin b/adapter_model.bin
index 3e8f72f386e2c3fe895fcb01c3f1de5f5fec965a..02526e93c7101a3c9d0727acfe024831696398f1 100644
--- a/adapter_model.bin
+++ b/adapter_model.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:14ca48bd88a31002dc05f9274bc978bc8b5b8ae3e51470e74ee7bc0bb12284e9
+oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95
 size 500897101
diff --git a/checkpoint-5000/adapter_model.bin b/checkpoint-5000/adapter_model.bin
deleted file mode 100644
index 74814d55a55053c55b191f943aebee3639caff0a..0000000000000000000000000000000000000000
--- a/checkpoint-5000/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:658b9b2dec5afef11956f93a69d1e5899dfaf7ec45314dbb9a4f4fe9a8d341ef
-size 500897101
diff --git a/checkpoint-5000/adapter_model/adapter_model.bin b/checkpoint-5000/adapter_model/adapter_model.bin
deleted file mode 100644
index 74814d55a55053c55b191f943aebee3639caff0a..0000000000000000000000000000000000000000
--- a/checkpoint-5000/adapter_model/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:658b9b2dec5afef11956f93a69d1e5899dfaf7ec45314dbb9a4f4fe9a8d341ef
-size 500897101
diff --git a/checkpoint-5000/optimizer.pt b/checkpoint-5000/optimizer.pt
deleted file mode 100644
index 8707c624320e26944a53fa9f047051d0b513a55d..0000000000000000000000000000000000000000
--- a/checkpoint-5000/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:41a19364f98039f3de4a4fce0e0896ae1c403fab5b0de5a6478b8b3154215366
-size 1001752701
diff --git a/checkpoint-5000/rng_state_0.pth b/checkpoint-5000/rng_state_0.pth
deleted file mode 100644
index f73c216ce5fd22f5ecf938f9ce19490ebda0e246..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_0.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c3591569acf36220e21cfa3f00c334d4afa5214c3fa0f7f20b6081190208a2ce
-size 27772
diff --git a/checkpoint-5000/rng_state_1.pth b/checkpoint-5000/rng_state_1.pth
deleted file mode 100644
index 9a1bca1061cb9ecbb689954ed2b3c0139d4c0cc6..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_1.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:8a3d8da1aa54796771be8e0f102c1ba0e9bce209cd7f83f5e4242dbd0a2bfb18
-size 27772
diff --git a/checkpoint-5000/rng_state_10.pth b/checkpoint-5000/rng_state_10.pth
deleted file mode 100644
index 80b4833fb8614da8c7b43ce2dc83031e875990e0..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_10.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:263b9c81bf6b52324cce079cb862bf0c4c6c076726306fe430175760cf77ce1d
-size 27789
diff --git a/checkpoint-5000/rng_state_11.pth b/checkpoint-5000/rng_state_11.pth
deleted file mode 100644
index 55da8e031dda486a87150730f3c006a6fbbf5def..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_11.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:bfd9622dd9c9e0f101a3891d78b76d8a750232389d97fff8a48e4ab0113e3bf0
-size 27789
diff --git a/checkpoint-5000/rng_state_12.pth b/checkpoint-5000/rng_state_12.pth
deleted file mode 100644
index 5b5cb3c73161b8926eb77bc67dfb981462a009f7..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_12.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:8b52b3225a4c307e1e07d040be377b2268078fb40662cf123cf14c9225dfc3d2
-size 27789
diff --git a/checkpoint-5000/rng_state_13.pth b/checkpoint-5000/rng_state_13.pth
deleted file mode 100644
index 6dfe05530fcc36078e9ea3388e3129a9802a8105..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_13.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a7022a9a5c490e593972113d5eec0a181e018cdd0b74c023342974a3d2a43471
-size 27789
diff --git a/checkpoint-5000/rng_state_2.pth b/checkpoint-5000/rng_state_2.pth
deleted file mode 100644
index 5cc368ebea4eb59351da0dda32d9a0191a27645a..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_2.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7ea427538851652ebb74224ead7e27e9853d1a0254ab5742c7f4e6a75f1a155b
-size 27772
diff --git a/checkpoint-5000/rng_state_3.pth b/checkpoint-5000/rng_state_3.pth
deleted file mode 100644
index 2653f6afc0753f4f0a4b58884924393c50bb80e6..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_3.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:84c0d3bf83700c5dcf78d4bca3c01d4661af97db85b1e1021458aa4ebf191dc3
-size 27772
diff --git a/checkpoint-5000/rng_state_4.pth b/checkpoint-5000/rng_state_4.pth
deleted file mode 100644
index 17dbc94de833c85869043071ac3cf178e4029c25..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_4.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:88b40363540e71d8f1d1cd8dbf6a880e5a85fe8c36554f2c6a6e6bf87eeee7ef
-size 27772
diff --git a/checkpoint-5000/rng_state_5.pth b/checkpoint-5000/rng_state_5.pth
deleted file mode 100644
index df12ecaeda7900c0fd8445f8454fddbd7f69c384..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_5.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f452a098fe1f3d5946e80ca1866e99d8de678f832a877b5bd605c904adccd168
-size 27772
diff --git a/checkpoint-5000/rng_state_6.pth b/checkpoint-5000/rng_state_6.pth
deleted file mode 100644
index e13e80df498039dec0d69c9dc155f6312a63f53f..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_6.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d6329d34fc46a440591bbc38dc3e735aa628275c46bc5f5d67ea60d2ac817c9f
-size 27772
diff --git a/checkpoint-5000/rng_state_7.pth b/checkpoint-5000/rng_state_7.pth
deleted file mode 100644
index 065afb9b400ec0ab624b9e2e1bd15cd06cf59c21..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_7.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:abc478444408d585c8510980bf6c3724dbd04c62fe3f44191f641810f4f2b408
-size 27772
diff --git a/checkpoint-5000/rng_state_8.pth b/checkpoint-5000/rng_state_8.pth
deleted file mode 100644
index e358a2d86e15d530d6710914fdaeabf2e6ef4dbe..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_8.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:43a4f27fdaf452bec4190380281039b2452b0cc819d9babdb1883bb6338b79df
-size 27772
diff --git a/checkpoint-5000/rng_state_9.pth b/checkpoint-5000/rng_state_9.pth
deleted file mode 100644
index b723433adb48a109d110cdae4d73db16f086be84..0000000000000000000000000000000000000000
--- a/checkpoint-5000/rng_state_9.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:bd492bc5d4f48c5532176ee3ad99275b5bfcd315a528c245cfa8d46477f6b13e
-size 27772
diff --git a/checkpoint-5000/scheduler.pt b/checkpoint-5000/scheduler.pt
deleted file mode 100644
index e2325daf95e132d92ec86f58b07155dcd7d36553..0000000000000000000000000000000000000000
--- a/checkpoint-5000/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:091fab5b44662db384d56b3c50422b403065ff0f62fb64f68c521ac3c38ad752
-size 627
diff --git a/checkpoint-5000/training_args.bin b/checkpoint-5000/training_args.bin
deleted file mode 100644
index 3c48003adcc192172e325b8bb81af1b30fac42f7..0000000000000000000000000000000000000000
--- a/checkpoint-5000/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:354c4769acaf21317d8ab58ba2dd133763f3bee1aec7488fb334e45f3e80ebc3
-size 4027
diff --git a/checkpoint-5100/adapter_model.bin b/checkpoint-5100/adapter_model.bin
deleted file mode 100644
index 02bfb0de2c8392b01220dbad54f7d5ef7442c98a..0000000000000000000000000000000000000000
--- a/checkpoint-5100/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0782e3c048e8ec06b53914deeacadabf30a533ab881541cd5057d49805c57014
-size 500897101
diff --git a/checkpoint-5100/adapter_model/adapter_model.bin b/checkpoint-5100/adapter_model/adapter_model.bin
deleted file mode 100644
index 02bfb0de2c8392b01220dbad54f7d5ef7442c98a..0000000000000000000000000000000000000000
--- a/checkpoint-5100/adapter_model/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0782e3c048e8ec06b53914deeacadabf30a533ab881541cd5057d49805c57014
-size 500897101
diff --git a/checkpoint-5100/optimizer.pt b/checkpoint-5100/optimizer.pt
deleted file mode 100644
index b21a87e8fcf3f6c85917ddfde8ff26a8760467d8..0000000000000000000000000000000000000000
--- a/checkpoint-5100/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:6e547facfed70ca3ced4bba623ceed57a68ada7036877bcb0fe8abdc4206a71d
-size 1001752701
diff --git a/checkpoint-5100/rng_state_0.pth b/checkpoint-5100/rng_state_0.pth
deleted file mode 100644
index efec54a19ef3ffcf3a35e80a278a57708f8818e3..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_0.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:93586c7c2f4af77dae57306cefbbba6e501b56255a6e8ab1e51526e93247ec0c
-size 27772
diff --git a/checkpoint-5100/rng_state_1.pth b/checkpoint-5100/rng_state_1.pth
deleted file mode 100644
index 006f0ce77824e8757b2a54d97497a090e281f67f..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_1.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:914cd17a4d5c2393130506ee74b380b7ebf49b994b8e1f7f9a5a5011789dcb9d
-size 27772
diff --git a/checkpoint-5100/rng_state_10.pth b/checkpoint-5100/rng_state_10.pth
deleted file mode 100644
index e924e089f5bee9985719b31ab4d4899670b1c7b3..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_10.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f79575017a903227eead6d8ec8c987f6c9f113b02cc3fdca1a05e6dfeb87c263
-size 27789
diff --git a/checkpoint-5100/rng_state_11.pth b/checkpoint-5100/rng_state_11.pth
deleted file mode 100644
index e74dbc2c8bb80a5090f72f29d5ad891986eb0b03..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_11.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e862437c6ef81136a36f5dcccf18047c8bf5b5ce5c4cb6a5de4068de8ac98fd4
-size 27789
diff --git a/checkpoint-5100/rng_state_12.pth b/checkpoint-5100/rng_state_12.pth
deleted file mode 100644
index c4ea8e665565e1e4ce619c18c3cf32bbb8416f68..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_12.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2bd910734bd5ed0209fccf18e21529e6637d89e5d932f3863bdeb79c5a9955a0
-size 27789
diff --git a/checkpoint-5100/rng_state_13.pth b/checkpoint-5100/rng_state_13.pth
deleted file mode 100644
index 4929b2e9b86f0460906db8eed7d1ab0156f238d2..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_13.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:bd706d0aeecfb525da3ab5daa901fe7638c2e7f5d4cee63cd71b6ca026275bdd
-size 27789
diff --git a/checkpoint-5100/rng_state_2.pth b/checkpoint-5100/rng_state_2.pth
deleted file mode 100644
index 5b6e339102453607790f1d3271c90300e1c20fb0..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_2.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a3cc4068be271200f493c6e5933125535d31c00d193a77baaf617e995cb80113
-size 27772
diff --git a/checkpoint-5100/rng_state_3.pth b/checkpoint-5100/rng_state_3.pth
deleted file mode 100644
index 3af67e7908ee466fca4f247cb88787d6b60f095a..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_3.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:134ec8578ce099215e557b373586d1334dcba1f9bc3678e21e8a11c8293273b5
-size 27772
diff --git a/checkpoint-5100/rng_state_4.pth b/checkpoint-5100/rng_state_4.pth
deleted file mode 100644
index 50ab2211005f0a24bf80d1ae93a75ee9073bedec..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_4.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2799584e6f3b97fb9250177cae1099c95a1a72f8c924828310d6e9c9f712a0ad
-size 27772
diff --git a/checkpoint-5100/rng_state_5.pth b/checkpoint-5100/rng_state_5.pth
deleted file mode 100644
index a237a79776db8339b3886a0cb5f1c1eed5125259..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_5.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d2d851757976cd5436fb4f7e4f6b90e86fd7eb7fd174ef2f06b786fab4c8b687
-size 27772
diff --git a/checkpoint-5100/rng_state_6.pth b/checkpoint-5100/rng_state_6.pth
deleted file mode 100644
index d0dc6ec1565fb3615ece7b1a24b4c7980b69e39c..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_6.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0944f297f8c989eaaaa8748e1b4a866de5757e645fa13d826211ad5f9bf81798
-size 27772
diff --git a/checkpoint-5100/rng_state_7.pth b/checkpoint-5100/rng_state_7.pth
deleted file mode 100644
index 3e592acb033fabefcc2e4a888058bfe7cff6aa4c..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_7.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f4847f06e89ac0c33e93f4108e29bba8a6a11b57185752e5a61d1d159db7176b
-size 27772
diff --git a/checkpoint-5100/rng_state_8.pth b/checkpoint-5100/rng_state_8.pth
deleted file mode 100644
index 7a5eb449223406d430f62368de0fca1b9ce65536..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_8.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:32e20dcbaf8912d2c4ea76cd78324e384e6e3f340b552198fd77b189a7f80400
-size 27772
diff --git a/checkpoint-5100/rng_state_9.pth b/checkpoint-5100/rng_state_9.pth
deleted file mode 100644
index 7522bf2d591e25026b8beb76abbbeff66bef52b9..0000000000000000000000000000000000000000
--- a/checkpoint-5100/rng_state_9.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:6299cbf9ce668897a91d6363b1369a182cddf5e47a03415dbcb196480ea98de3
-size 27772
diff --git a/checkpoint-5100/scheduler.pt b/checkpoint-5100/scheduler.pt
deleted file mode 100644
index b0b8abd7dade13ecdfafa417ba979fa207247f37..0000000000000000000000000000000000000000
--- a/checkpoint-5100/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:04c0158b55de3dc26efbfe9fb78f379b4093417c7720f3a9de19f86082d0caf3
-size 627
diff --git a/checkpoint-5100/training_args.bin b/checkpoint-5100/training_args.bin
deleted file mode 100644
index 43b519cde185d2521e004dc718270044540f5e9c..0000000000000000000000000000000000000000
--- a/checkpoint-5100/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b5cc18faa1420e425c2fed06bfe2dd967461487c15531bd94429b7a3c0c02a49
-size 4027
diff --git a/checkpoint-5200/adapter_model.bin b/checkpoint-5200/adapter_model.bin
deleted file mode 100644
index 4603cec9d970dae967d1fe03601443f982651c54..0000000000000000000000000000000000000000
--- a/checkpoint-5200/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:28c2d0c51dd5ec8f66ff0bbdb8ae6185bd1eca75e6b3b3409367c09446351f5a
-size 500897101
diff --git a/checkpoint-5200/adapter_model/adapter_config.json b/checkpoint-5200/adapter_model/adapter_config.json
deleted file mode 100644
index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..0000000000000000000000000000000000000000
--- a/checkpoint-5200/adapter_model/adapter_config.json
+++ /dev/null
@@ -1,26 +0,0 @@
-{
-  "auto_mapping": null,
-  "base_model_name_or_path": "/workspace/webui/models/TheBloke_Llama-2-13B-fp16",
-  "bias": "none",
-  "fan_in_fan_out": null,
-  "inference_mode": true,
-  "init_lora_weights": true,
-  "layers_pattern": null,
-  "layers_to_transform": null,
-  "lora_alpha": 16,
-  "lora_dropout": 0.05,
-  "modules_to_save": null,
-  "peft_type": "LORA",
-  "r": 32,
-  "revision": null,
-  "target_modules": [
-    "v_proj",
-    "up_proj",
-    "k_proj",
-    "q_proj",
-    "down_proj",
-    "gate_proj",
-    "o_proj"
-  ],
-  "task_type": "CAUSAL_LM"
-}
\ No newline at end of file
diff --git a/checkpoint-5200/adapter_model/adapter_model.bin b/checkpoint-5200/adapter_model/adapter_model.bin
deleted file mode 100644
index 4603cec9d970dae967d1fe03601443f982651c54..0000000000000000000000000000000000000000
--- a/checkpoint-5200/adapter_model/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:28c2d0c51dd5ec8f66ff0bbdb8ae6185bd1eca75e6b3b3409367c09446351f5a
-size 500897101
diff --git a/checkpoint-5200/optimizer.pt b/checkpoint-5200/optimizer.pt
deleted file mode 100644
index 3bf258fce44f70ab030011d1d1bc825f78c75fe3..0000000000000000000000000000000000000000
--- a/checkpoint-5200/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:897aecb8fea53f1688ee40f5672ba9bf2f9263d05d96d719af5a024da878838c
-size 1001752701
diff --git a/checkpoint-5200/rng_state_0.pth b/checkpoint-5200/rng_state_0.pth
deleted file mode 100644
index 06dd14cb71f3b351e9ae50bdb44b62e88cde3b31..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_0.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7d3ab65c749e5fc734aff9ca0257ff2b5fbec92bf74548f706dd50a3522d9444
-size 27772
diff --git a/checkpoint-5200/rng_state_1.pth b/checkpoint-5200/rng_state_1.pth
deleted file mode 100644
index 8b972a8eb856a661fcd533cae37605b2b2fb95f8..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_1.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0ac25dcd9dd77c6157fe871ffedc3311d277b0f3767923cc0debee8decbcac7c
-size 27772
diff --git a/checkpoint-5200/rng_state_10.pth b/checkpoint-5200/rng_state_10.pth
deleted file mode 100644
index eaf20c8bbef0790aa366c98de761027cb6f3de0a..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_10.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e8ef400cc06c347a4b973def87d07c600ccc0901bb7459cbac62d3b61528b1ea
-size 27789
diff --git a/checkpoint-5200/rng_state_11.pth b/checkpoint-5200/rng_state_11.pth
deleted file mode 100644
index b79a3c538aa7e18f090761946d884b3367298366..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_11.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:943fb5b9798db2076d7d142d97ef850652f063b322a6b291b70fd36b2873faee
-size 27789
diff --git a/checkpoint-5200/rng_state_12.pth b/checkpoint-5200/rng_state_12.pth
deleted file mode 100644
index 9987c8ffddad292a42cdc5894c097ac31c1d47d7..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_12.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4ba67e4d875ae627926fabe393d78116d78522c74be3715f12895caeb0451111
-size 27789
diff --git a/checkpoint-5200/rng_state_13.pth b/checkpoint-5200/rng_state_13.pth
deleted file mode 100644
index 091de895d16cccb3c6da890b8639bad827edea90..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_13.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:5c1a40cb952561fb635e6a63b2e31f99fe76eb7379d5250b36d6ceae7607d513
-size 27789
diff --git a/checkpoint-5200/rng_state_2.pth b/checkpoint-5200/rng_state_2.pth
deleted file mode 100644
index 081a4e852e0f8945fcf0c1bbe401c18bba590a86..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_2.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f49dff9815ef5438a07a8ce0274d35913fc7fd66a9c5e39708a3ed2f5a34531d
-size 27772
diff --git a/checkpoint-5200/rng_state_3.pth b/checkpoint-5200/rng_state_3.pth
deleted file mode 100644
index da61e91972422c74a684f9de7488fed4771a6d30..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_3.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d74211b2b26e9e6e27b2c293da7f898aff1fb43b386304ece8902e9e03cf6ea2
-size 27772
diff --git a/checkpoint-5200/rng_state_4.pth b/checkpoint-5200/rng_state_4.pth
deleted file mode 100644
index bd87d2b76577161b6b76cdf9be44d998e91a208b..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_4.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f5969252b504ae24eacec7e5ddc1b6375bff73d3b276cd991e25169c2101ec3c
-size 27772
diff --git a/checkpoint-5200/rng_state_5.pth b/checkpoint-5200/rng_state_5.pth
deleted file mode 100644
index dab5412dfe05e034051e75149d46fe7c2e4409e3..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_5.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d96767afd301e0dfec9849df22aeb52b119511b35dae4fd79e1b3e8bab29d1b8
-size 27772
diff --git a/checkpoint-5200/rng_state_6.pth b/checkpoint-5200/rng_state_6.pth
deleted file mode 100644
index e8d658bdb81092c1bac24484fd73ca8641c50917..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_6.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:25bc6e2e8c95bccdcf883e1283d17bb4645e87943be9d87983483a6e0ea62d19
-size 27772
diff --git a/checkpoint-5200/rng_state_7.pth b/checkpoint-5200/rng_state_7.pth
deleted file mode 100644
index cef9722d3a1c0ad35789ef056eaa8bbfabe62e88..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_7.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:07239f8fab222d643c376b32e823fe2fa4e52c750e68bd07603feed81ab05f92
-size 27772
diff --git a/checkpoint-5200/rng_state_8.pth b/checkpoint-5200/rng_state_8.pth
deleted file mode 100644
index 0bc0db080dd211eb9114f10f4d7d5860fcd1251b..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_8.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:126ef2192c7378d259ac9b7f6cc0f79e375ae619b07be1f34655a49f1c8090fa
-size 27772
diff --git a/checkpoint-5200/rng_state_9.pth b/checkpoint-5200/rng_state_9.pth
deleted file mode 100644
index dd196ac0cbfe92f452825a78370a30048b487390..0000000000000000000000000000000000000000
--- a/checkpoint-5200/rng_state_9.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4c655791adbb1473fdfbba3cd090a95b3182ba0fabeb7693d4b7675966dd0edc
-size 27772
diff --git a/checkpoint-5200/scheduler.pt b/checkpoint-5200/scheduler.pt
deleted file mode 100644
index 09b47cb01e336327b19380c7da592c19c4199ffc..0000000000000000000000000000000000000000
--- a/checkpoint-5200/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c657cc9c9f16f76f05d9497e2e29beeb126df858e2b635edfaa2b24e78fb2f61
-size 627
diff --git a/checkpoint-5200/training_args.bin b/checkpoint-5200/training_args.bin
deleted file mode 100644
index 43b519cde185d2521e004dc718270044540f5e9c..0000000000000000000000000000000000000000
--- a/checkpoint-5200/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b5cc18faa1420e425c2fed06bfe2dd967461487c15531bd94429b7a3c0c02a49
-size 4027
diff --git a/checkpoint-5300/adapter_model.bin b/checkpoint-5300/adapter_model.bin
deleted file mode 100644
index 3e8f72f386e2c3fe895fcb01c3f1de5f5fec965a..0000000000000000000000000000000000000000
--- a/checkpoint-5300/adapter_model.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:14ca48bd88a31002dc05f9274bc978bc8b5b8ae3e51470e74ee7bc0bb12284e9
-size 500897101
diff --git a/checkpoint-5300/optimizer.pt b/checkpoint-5300/optimizer.pt
deleted file mode 100644
index 5b8133534a2b769e5c5d5403b729c67018470260..0000000000000000000000000000000000000000
--- a/checkpoint-5300/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:869a51ca719bee8b6aab465be97fa4ac5e228c769321c2712f644067ceeca076
-size 1001752701
diff --git a/checkpoint-5300/rng_state_0.pth b/checkpoint-5300/rng_state_0.pth
deleted file mode 100644
index 552dc8ef95a545c64426e4c5711d142bd87b7760..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_0.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:9267467db4bfc0b62f4b2992b98c478568d6b740025cdb5016f4102da1504163
-size 27772
diff --git a/checkpoint-5300/rng_state_1.pth b/checkpoint-5300/rng_state_1.pth
deleted file mode 100644
index cf291739827b5154f004a189694861e364b08a68..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_1.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ea0db0e586ec1c1e547243b2e02d8b0d760f3d113e51420b567322fb80b86283
-size 27772
diff --git a/checkpoint-5300/rng_state_10.pth b/checkpoint-5300/rng_state_10.pth
deleted file mode 100644
index 839a575806286f384bca65e6c6ed4b642fee5af0..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_10.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fcfb12512c0be896f0842434c14afaa23ede7d6aadbd83bfd18570859fcdecdd
-size 27789
diff --git a/checkpoint-5300/rng_state_11.pth b/checkpoint-5300/rng_state_11.pth
deleted file mode 100644
index 494cf039101c4fc79b0f4f48619b309ef5eeca44..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_11.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fcd57397386863534e25c2052e0eb5a3986965528e8332bead4e6da6c8a52a60
-size 27789
diff --git a/checkpoint-5300/rng_state_12.pth b/checkpoint-5300/rng_state_12.pth
deleted file mode 100644
index d1ab254f55a9249593c17a205b750a8399f6942e..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_12.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3b494220b086ab33c457cd9cb3298d5707ae27861e1a1ea15cf7b2846c34edb3
-size 27789
diff --git a/checkpoint-5300/rng_state_13.pth b/checkpoint-5300/rng_state_13.pth
deleted file mode 100644
index e7da07b270a41ff605eff193c3c775f63cefdf4b..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_13.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:66ddbbc44b73707a46dbe70a821775b9215bfb3188b97867dfd5d788f2c4bd1b
-size 27789
diff --git a/checkpoint-5300/rng_state_2.pth b/checkpoint-5300/rng_state_2.pth
deleted file mode 100644
index 8b750c8a0158ec37f230d464ed21d7088af86a15..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_2.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e09271dc29724c758580e8e6864e76555b7a1dd95ca5d0036f08cdd9f67fbaec
-size 27772
diff --git a/checkpoint-5300/rng_state_3.pth b/checkpoint-5300/rng_state_3.pth
deleted file mode 100644
index ec433ee7fc69d37df74002cecc5f6319b94e268f..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_3.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:65b0c519b8283902066db24d39bebbf0ec0f57d632779c56be9c9d58f7cdb78e
-size 27772
diff --git a/checkpoint-5300/rng_state_4.pth b/checkpoint-5300/rng_state_4.pth
deleted file mode 100644
index dc27c448e896fad22f68efc178f08e10e7431ab5..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_4.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:868a6a26d82f017652ee4b9e21c96ec36ab5f96be4eeedf65e27eda71ff93f25
-size 27772
diff --git a/checkpoint-5300/rng_state_5.pth b/checkpoint-5300/rng_state_5.pth
deleted file mode 100644
index fa32e1f6b7712309b3c8943e87f2650e2c5a13cb..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_5.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d82c47d40cdc9cbed8bc1b1f8fdcb354fb8b6ac525cfce07fab2d1af5791c195
-size 27772
diff --git a/checkpoint-5300/rng_state_6.pth b/checkpoint-5300/rng_state_6.pth
deleted file mode 100644
index 28ae8ef924932d456fd13a2995c8932487990c8e..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_6.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:64d8ec328ebab19d4fa69241bbb5de66af7b09aa5f0d71d9e37be38a5170d24e
-size 27772
diff --git a/checkpoint-5300/rng_state_7.pth b/checkpoint-5300/rng_state_7.pth
deleted file mode 100644
index d9ecf5bafb7af425590b22c77078d9409670f728..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_7.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cf9d89caef032992b8f5efcdaf7ab987e37e4fb52ec8d47520f814092e1e7ab3
-size 27772
diff --git a/checkpoint-5300/rng_state_8.pth b/checkpoint-5300/rng_state_8.pth
deleted file mode 100644
index 34110f26cf1c2d148a91aa260ddf93627bdc3069..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_8.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:8913ebfea32419c486eaa9895c49a7962a44933cd37f4965710a3560fe737c25
-size 27772
diff --git a/checkpoint-5300/rng_state_9.pth b/checkpoint-5300/rng_state_9.pth
deleted file mode 100644
index acee305b8ff2eb6687dabfd9c1220f25aacfff20..0000000000000000000000000000000000000000
--- a/checkpoint-5300/rng_state_9.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:685f43d3417ce77333bd61cb9e79c3d6e0421bb659bae8689caafc6c6b0d8752
-size 27772
diff --git a/checkpoint-5300/scheduler.pt b/checkpoint-5300/scheduler.pt
deleted file mode 100644
index c25a03466ceea6c5cb534559ebdfa7a51ae48c90..0000000000000000000000000000000000000000
--- a/checkpoint-5300/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0d904fb502ced275ef5e7925781f477f4c89d48daa60e9f45b9339adf1aaa77d
-size 627
diff --git a/checkpoint-5000/README.md b/checkpoint-5400/README.md
similarity index 100%
rename from checkpoint-5000/README.md
rename to checkpoint-5400/README.md
diff --git a/checkpoint-5300/adapter_config.json b/checkpoint-5400/adapter_config.json
similarity index 100%
rename from checkpoint-5300/adapter_config.json
rename to checkpoint-5400/adapter_config.json
diff --git a/checkpoint-5400/adapter_model.bin b/checkpoint-5400/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd156ad5028e919f5cb218fb803514d02505cbc1
--- /dev/null
+++ b/checkpoint-5400/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a996a2cd6511d12fe1f6c74e5551595b29964345d9c5913a1440514d20e74909
+size 500897101
diff --git a/checkpoint-5000/adapter_model/README.md b/checkpoint-5400/adapter_model/README.md
similarity index 100%
rename from checkpoint-5000/adapter_model/README.md
rename to checkpoint-5400/adapter_model/README.md
diff --git a/checkpoint-5000/adapter_config.json b/checkpoint-5400/adapter_model/adapter_config.json
similarity index 100%
rename from checkpoint-5000/adapter_config.json
rename to checkpoint-5400/adapter_model/adapter_config.json
index 2086dcb8a3bcbe9772b1971a2a24239b77070fbb..5b3f45c250ff330299d2364a46de0623dadd2f48 100644
--- a/checkpoint-5000/adapter_config.json
+++ b/checkpoint-5400/adapter_model/adapter_config.json
@@ -14,12 +14,12 @@
   "r": 32,
   "revision": null,
   "target_modules": [
-    "k_proj",
+    "q_proj",
+    "gate_proj",
     "o_proj",
     "down_proj",
-    "gate_proj",
+    "k_proj",
     "v_proj",
-    "q_proj",
     "up_proj"
   ],
   "task_type": "CAUSAL_LM"
diff --git a/checkpoint-5400/adapter_model/adapter_model.bin b/checkpoint-5400/adapter_model/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd156ad5028e919f5cb218fb803514d02505cbc1
--- /dev/null
+++ b/checkpoint-5400/adapter_model/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a996a2cd6511d12fe1f6c74e5551595b29964345d9c5913a1440514d20e74909
+size 500897101
diff --git a/checkpoint-5400/optimizer.pt b/checkpoint-5400/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..7555b0c057bbcb347ed43d17da54abb9e1d8111d
--- /dev/null
+++ b/checkpoint-5400/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a049c191517e4cc2442d5e383237bf35c7e90159b14ee20f4ef3f1e917c94f7d
+size 1001752701
diff --git a/checkpoint-5400/rng_state_0.pth b/checkpoint-5400/rng_state_0.pth
new file mode 100644
index 0000000000000000000000000000000000000000..647a6426e65252cf43935d08344af7babeb064c0
--- /dev/null
+++ b/checkpoint-5400/rng_state_0.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7bb5c299ce12f96c89868d521ed520c7ace1a7a288b7b7a826d6e603aeb79a09
+size 27772
diff --git a/checkpoint-5400/rng_state_1.pth b/checkpoint-5400/rng_state_1.pth
new file mode 100644
index 0000000000000000000000000000000000000000..9724602cab7fc1a573eb5dfd68d8f25fd3ba9939
--- /dev/null
+++ b/checkpoint-5400/rng_state_1.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c1b9ccab0a7c765a8ccd991c977a9ffc75c10546853ccb44210b37c9347c640
+size 27772
diff --git a/checkpoint-5400/rng_state_10.pth b/checkpoint-5400/rng_state_10.pth
new file mode 100644
index 0000000000000000000000000000000000000000..022296ad01f7119105de863dfecde9f2e14fdc5b
--- /dev/null
+++ b/checkpoint-5400/rng_state_10.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a9597f7462f3230a6cbef5e02b36f74b70ccfcdcc850d8c7e131d92db196783
+size 27789
diff --git a/checkpoint-5400/rng_state_11.pth b/checkpoint-5400/rng_state_11.pth
new file mode 100644
index 0000000000000000000000000000000000000000..56f555cbe7b4f5a0bfdd45d1c41592d5b3e9f922
--- /dev/null
+++ b/checkpoint-5400/rng_state_11.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8af70b0d7c5428460585eb71f0762f807411f8fcb9745d5f3d67da929bebac6
+size 27789
diff --git a/checkpoint-5400/rng_state_12.pth b/checkpoint-5400/rng_state_12.pth
new file mode 100644
index 0000000000000000000000000000000000000000..1be68b3531c92a104382b223bcd2a5e21cdea62b
--- /dev/null
+++ b/checkpoint-5400/rng_state_12.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e6923f879a023dad7d6429c5f4ae2372fbd5ee6569ab6149a7cdae5b14fb3c3
+size 27789
diff --git a/checkpoint-5400/rng_state_13.pth b/checkpoint-5400/rng_state_13.pth
new file mode 100644
index 0000000000000000000000000000000000000000..23988612a99f202bd1f90afecb4bb41fb555be99
--- /dev/null
+++ b/checkpoint-5400/rng_state_13.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c5a179975104cf77a9e13a52a805da05b0e24a85d3849b0f5c3e5420f17eea8
+size 27789
diff --git a/checkpoint-5400/rng_state_2.pth b/checkpoint-5400/rng_state_2.pth
new file mode 100644
index 0000000000000000000000000000000000000000..254c5961935c97254ef1f4227805b6f27c4edaea
--- /dev/null
+++ b/checkpoint-5400/rng_state_2.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:739e768c2ad37f578b983337dedf3c7558c279d10f81301e90d17df333839571
+size 27772
diff --git a/checkpoint-5400/rng_state_3.pth b/checkpoint-5400/rng_state_3.pth
new file mode 100644
index 0000000000000000000000000000000000000000..03da82bdfdad227d441685f3eaef44508556a1be
--- /dev/null
+++ b/checkpoint-5400/rng_state_3.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ef2ea61eeb1cf909c75298fb11154372946533cb23888c32bb3d5dbf8f450be
+size 27772
diff --git a/checkpoint-5400/rng_state_4.pth b/checkpoint-5400/rng_state_4.pth
new file mode 100644
index 0000000000000000000000000000000000000000..cd14e28b48e5f9f2574ee0d75c78927f9119c929
--- /dev/null
+++ b/checkpoint-5400/rng_state_4.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6a0df83ddd7c2adb2cfaa37c8e8ef974c3ee5b10b047c9debb55e91b9c6abfa0
+size 27772
diff --git a/checkpoint-5400/rng_state_5.pth b/checkpoint-5400/rng_state_5.pth
new file mode 100644
index 0000000000000000000000000000000000000000..07748b51d97d028c3487f01b56d39221b95d1fd8
--- /dev/null
+++ b/checkpoint-5400/rng_state_5.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28d8090af65c1044a84f75fca5aaad6150338b890ba2ff8a597eb42e98730156
+size 27772
diff --git a/checkpoint-5400/rng_state_6.pth b/checkpoint-5400/rng_state_6.pth
new file mode 100644
index 0000000000000000000000000000000000000000..7f8ad871dcef65ddc3c6d6c74943d5af367e93da
--- /dev/null
+++ b/checkpoint-5400/rng_state_6.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39eb6a8461a3f8f64867ca24431f39e0c189f967e51fc06b1cd04b61557b7ab5
+size 27772
diff --git a/checkpoint-5400/rng_state_7.pth b/checkpoint-5400/rng_state_7.pth
new file mode 100644
index 0000000000000000000000000000000000000000..3ca23cfac756660d83bdfb1aba90ee48188b0f64
--- /dev/null
+++ b/checkpoint-5400/rng_state_7.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c082109f0ab8381e4f9518c09cb1c66ba874df40524ab79671e907b2bae40124
+size 27772
diff --git a/checkpoint-5400/rng_state_8.pth b/checkpoint-5400/rng_state_8.pth
new file mode 100644
index 0000000000000000000000000000000000000000..a0f7361e8b7974957dfa1528f4444566f026e19c
--- /dev/null
+++ b/checkpoint-5400/rng_state_8.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e09522662a1c7e523f238f6591ac23db965da78361158348b4370a4a0e5cadc9
+size 27772
diff --git a/checkpoint-5400/rng_state_9.pth b/checkpoint-5400/rng_state_9.pth
new file mode 100644
index 0000000000000000000000000000000000000000..58b1b613012a8d080ec41d7e4c15bd56c5c5cec8
--- /dev/null
+++ b/checkpoint-5400/rng_state_9.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b144a36861671d0f406faba8754207d253d86202309d2a0cf2f6675277d4179
+size 27772
diff --git a/checkpoint-5400/scheduler.pt b/checkpoint-5400/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..d1be0e334dd83be886ca4f8fac072c80978e3367
--- /dev/null
+++ b/checkpoint-5400/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ced8c2de33809dd534295dd5742d2284a2f142b85e0e85a7f49385eb1bef7354
+size 627
diff --git a/checkpoint-5300/trainer_state.json b/checkpoint-5400/trainer_state.json
similarity index 97%
rename from checkpoint-5300/trainer_state.json
rename to checkpoint-5400/trainer_state.json
index 119d10f474474ee53860d56031071f00f9c5117c..2189af52f6e9c44add63f68f896d86aa0f21830e 100644
--- a/checkpoint-5300/trainer_state.json
+++ b/checkpoint-5400/trainer_state.json
@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.055060100814269,
-  "global_step": 5300,
+  "epoch": 2.093834819697557,
+  "global_step": 5400,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1294,11 +1294,35 @@
       "learning_rate": 4.519953408196152e-05,
       "loss": 0.7424,
       "step": 5300
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.435215802306635e-05,
+      "loss": 0.7521,
+      "step": 5325
+    },
+    {
+      "epoch": 2.07,
+      "learning_rate": 4.351053109942894e-05,
+      "loss": 0.7477,
+      "step": 5350
+    },
+    {
+      "epoch": 2.08,
+      "learning_rate": 4.2674740261896776e-05,
+      "loss": 0.7456,
+      "step": 5375
+    },
+    {
+      "epoch": 2.09,
+      "learning_rate": 4.1844871858374844e-05,
+      "loss": 0.766,
+      "step": 5400
     }
   ],
   "max_steps": 7737,
   "num_train_epochs": 3,
-  "total_flos": 2.282482987033428e+19,
+  "total_flos": 2.325582880769573e+19,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/checkpoint-5300/training_args.bin b/checkpoint-5400/training_args.bin
similarity index 100%
rename from checkpoint-5300/training_args.bin
rename to checkpoint-5400/training_args.bin
diff --git a/checkpoint-5100/README.md b/checkpoint-5500/README.md
similarity index 100%
rename from checkpoint-5100/README.md
rename to checkpoint-5500/README.md
diff --git a/checkpoint-5000/adapter_model/adapter_config.json b/checkpoint-5500/adapter_config.json
similarity index 100%
rename from checkpoint-5000/adapter_model/adapter_config.json
rename to checkpoint-5500/adapter_config.json
index 2086dcb8a3bcbe9772b1971a2a24239b77070fbb..5b3f45c250ff330299d2364a46de0623dadd2f48 100644
--- a/checkpoint-5000/adapter_model/adapter_config.json
+++ b/checkpoint-5500/adapter_config.json
@@ -14,12 +14,12 @@
   "r": 32,
   "revision": null,
   "target_modules": [
-    "k_proj",
+    "q_proj",
+    "gate_proj",
     "o_proj",
     "down_proj",
-    "gate_proj",
+    "k_proj",
     "v_proj",
-    "q_proj",
     "up_proj"
   ],
   "task_type": "CAUSAL_LM"
diff --git a/checkpoint-5500/adapter_model.bin b/checkpoint-5500/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f25b271253aa1d3a3bd632c7016f808689db2a29
--- /dev/null
+++ b/checkpoint-5500/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c7243d5bc7b28d5d5a4bafb40fe933dd1f5d2b41c4b35311c4562dd50c5883a
+size 500897101
diff --git a/checkpoint-5100/adapter_model/README.md b/checkpoint-5500/adapter_model/README.md
similarity index 100%
rename from checkpoint-5100/adapter_model/README.md
rename to checkpoint-5500/adapter_model/README.md
diff --git a/checkpoint-5100/adapter_config.json b/checkpoint-5500/adapter_model/adapter_config.json
similarity index 94%
rename from checkpoint-5100/adapter_config.json
rename to checkpoint-5500/adapter_model/adapter_config.json
index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..5b3f45c250ff330299d2364a46de0623dadd2f48 100644
--- a/checkpoint-5100/adapter_config.json
+++ b/checkpoint-5500/adapter_model/adapter_config.json
@@ -14,13 +14,13 @@
   "r": 32,
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "up_proj",
-    "k_proj",
     "q_proj",
-    "down_proj",
     "gate_proj",
-    "o_proj"
+    "o_proj",
+    "down_proj",
+    "k_proj",
+    "v_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM"
 }
\ No newline at end of file
diff --git a/checkpoint-5500/adapter_model/adapter_model.bin b/checkpoint-5500/adapter_model/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f25b271253aa1d3a3bd632c7016f808689db2a29
--- /dev/null
+++ b/checkpoint-5500/adapter_model/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c7243d5bc7b28d5d5a4bafb40fe933dd1f5d2b41c4b35311c4562dd50c5883a
+size 500897101
diff --git a/checkpoint-5500/optimizer.pt b/checkpoint-5500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..9de25741384aed487c7fd491f6d7000ab7391a28
--- /dev/null
+++ b/checkpoint-5500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80adf9c30a8a3ebab96b13b5000ed1b3eb4306228d36a12dfadc4e7cc433a4ec
+size 1001752701
diff --git a/checkpoint-5500/rng_state_0.pth b/checkpoint-5500/rng_state_0.pth
new file mode 100644
index 0000000000000000000000000000000000000000..375583ee0114caccc2517feebcce2c8d1c5bbef2
--- /dev/null
+++ b/checkpoint-5500/rng_state_0.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30e0a79fb2da13095943ed5d6ff4010e829f95de5b910b4f831e610487314e6f
+size 27772
diff --git a/checkpoint-5500/rng_state_1.pth b/checkpoint-5500/rng_state_1.pth
new file mode 100644
index 0000000000000000000000000000000000000000..54a3655e3b78b20585701028c092f2637fd2ce00
--- /dev/null
+++ b/checkpoint-5500/rng_state_1.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5459f0eefaad357478856f70446e39da7b343e17571839caaa8a02c194f7d669
+size 27772
diff --git a/checkpoint-5500/rng_state_10.pth b/checkpoint-5500/rng_state_10.pth
new file mode 100644
index 0000000000000000000000000000000000000000..75a9f4a9e9fd3a7a62591d00ff06be84e71aea34
--- /dev/null
+++ b/checkpoint-5500/rng_state_10.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:386be381ea58870ea29c419ee56fe49473c2a98987edeacf220a45b1a2223941
+size 27789
diff --git a/checkpoint-5500/rng_state_11.pth b/checkpoint-5500/rng_state_11.pth
new file mode 100644
index 0000000000000000000000000000000000000000..b586bcfc5015187309aa7af69f45cbb254144307
--- /dev/null
+++ b/checkpoint-5500/rng_state_11.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d4e40b2e53f6a7d00bfd79e9648b446e522e5f1b008a72d0ecf49f8afaa037c8
+size 27789
diff --git a/checkpoint-5500/rng_state_12.pth b/checkpoint-5500/rng_state_12.pth
new file mode 100644
index 0000000000000000000000000000000000000000..c29c388f13f32dae9c32e4c071fda464405a9322
--- /dev/null
+++ b/checkpoint-5500/rng_state_12.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:800d188559c734beb02115217b063e8bb6cb7259475ac5e72045222c4e97d3ae
+size 27789
diff --git a/checkpoint-5500/rng_state_13.pth b/checkpoint-5500/rng_state_13.pth
new file mode 100644
index 0000000000000000000000000000000000000000..3ba5ed295cf29346055bdd5cf0eafe42825ef71a
--- /dev/null
+++ b/checkpoint-5500/rng_state_13.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:675b5fc0a7deb4335cae143f3a24d62ea65052ce52feb5d15793418be4662ac8
+size 27789
diff --git a/checkpoint-5500/rng_state_2.pth b/checkpoint-5500/rng_state_2.pth
new file mode 100644
index 0000000000000000000000000000000000000000..4680c515e6a46cff17f2e62d732fb07f95ab77ba
--- /dev/null
+++ b/checkpoint-5500/rng_state_2.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6acf616edcf44f8c9ecee1675d30b9f4f2d2de918203c9ebb49e8a44b17d57c
+size 27772
diff --git a/checkpoint-5500/rng_state_3.pth b/checkpoint-5500/rng_state_3.pth
new file mode 100644
index 0000000000000000000000000000000000000000..64ec2a11029a7441175ee5542c99c46dc5619f04
--- /dev/null
+++ b/checkpoint-5500/rng_state_3.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b2a7c589905769b0dbc43278783063253c4361403cb5e93a12c744d0c001f090
+size 27772
diff --git a/checkpoint-5500/rng_state_4.pth b/checkpoint-5500/rng_state_4.pth
new file mode 100644
index 0000000000000000000000000000000000000000..5227670a97240c57e138f4d60872d572b75fc996
--- /dev/null
+++ b/checkpoint-5500/rng_state_4.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3eca9eeb1ff3b7857657d5e2e3990c3de3e6f2dc13c394c9ae206a0dc471b87a
+size 27772
diff --git a/checkpoint-5500/rng_state_5.pth b/checkpoint-5500/rng_state_5.pth
new file mode 100644
index 0000000000000000000000000000000000000000..8a33ed4598f2324bbe058926b7491927b7b77932
--- /dev/null
+++ b/checkpoint-5500/rng_state_5.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b17e2394c1de98b9b25d7d58415327217900745e09f7ab9276a36f8c4ea50f4f
+size 27772
diff --git a/checkpoint-5500/rng_state_6.pth b/checkpoint-5500/rng_state_6.pth
new file mode 100644
index 0000000000000000000000000000000000000000..ca5795980d78ac96cd5daf1bdf5c0858e8b2a832
--- /dev/null
+++ b/checkpoint-5500/rng_state_6.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a1131467c982915441e4d4625565d4d9601fd3f17521d48e909b1e53bfaff94c
+size 27772
diff --git a/checkpoint-5500/rng_state_7.pth b/checkpoint-5500/rng_state_7.pth
new file mode 100644
index 0000000000000000000000000000000000000000..fb891e32df8c55a1398132e80f30d6e272792afb
--- /dev/null
+++ b/checkpoint-5500/rng_state_7.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:293b86ebb5ed10caa66ef5329f9bec84416b4637fe61389a51d73c4026771d2c
+size 27772
diff --git a/checkpoint-5500/rng_state_8.pth b/checkpoint-5500/rng_state_8.pth
new file mode 100644
index 0000000000000000000000000000000000000000..acd4ffee7fb61ee99058b6beda1331dcd5f97e75
--- /dev/null
+++ b/checkpoint-5500/rng_state_8.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:686f925d57ef5c5206a88fc40e5fc96231e3bf44a2a0b7213509ab2181ee4b8f
+size 27772
diff --git a/checkpoint-5500/rng_state_9.pth b/checkpoint-5500/rng_state_9.pth
new file mode 100644
index 0000000000000000000000000000000000000000..078b89d1d2eb8b5500cfe358a93cf0ab5b560d5c
--- /dev/null
+++ b/checkpoint-5500/rng_state_9.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f2aba6953f527967beec2652c8b9c0bb338e770c0158e5e0f3e5100d0f7bc63
+size 27772
diff --git a/checkpoint-5500/scheduler.pt b/checkpoint-5500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..a13f5f4b1c314e1988588849c40d157694f99e3a
--- /dev/null
+++ b/checkpoint-5500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ceeb3b5fc20812592b97207e07386031eb6265ebb23202022487dfc5a6412586
+size 627
diff --git a/checkpoint-5200/trainer_state.json b/checkpoint-5500/trainer_state.json
similarity index 94%
rename from checkpoint-5200/trainer_state.json
rename to checkpoint-5500/trainer_state.json
index 97b3abd665702c8773f0ea57e83d10c932db6f9d..e329e3c79569c013bed16a6058c7908dcf40a6a7 100644
--- a/checkpoint-5200/trainer_state.json
+++ b/checkpoint-5500/trainer_state.json
@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.016285381930981,
-  "global_step": 5200,
+  "epoch": 2.1326095385808452,
+  "global_step": 5500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1270,11 +1270,83 @@
       "learning_rate": 4.864477005494938e-05,
       "loss": 0.7654,
       "step": 5200
+    },
+    {
+      "epoch": 2.03,
+      "learning_rate": 4.777527870665592e-05,
+      "loss": 0.7468,
+      "step": 5225
+    },
+    {
+      "epoch": 2.04,
+      "learning_rate": 4.691118284138296e-05,
+      "loss": 0.7359,
+      "step": 5250
+    },
+    {
+      "epoch": 2.05,
+      "learning_rate": 4.605257173130763e-05,
+      "loss": 0.7422,
+      "step": 5275
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.519953408196152e-05,
+      "loss": 0.7424,
+      "step": 5300
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.435215802306635e-05,
+      "loss": 0.7521,
+      "step": 5325
+    },
+    {
+      "epoch": 2.07,
+      "learning_rate": 4.351053109942894e-05,
+      "loss": 0.7477,
+      "step": 5350
+    },
+    {
+      "epoch": 2.08,
+      "learning_rate": 4.2674740261896776e-05,
+      "loss": 0.7456,
+      "step": 5375
+    },
+    {
+      "epoch": 2.09,
+      "learning_rate": 4.1844871858374844e-05,
+      "loss": 0.766,
+      "step": 5400
+    },
+    {
+      "epoch": 2.1,
+      "learning_rate": 4.1021011624904814e-05,
+      "loss": 0.7664,
+      "step": 5425
+    },
+    {
+      "epoch": 2.11,
+      "learning_rate": 4.0203244676807353e-05,
+      "loss": 0.7703,
+      "step": 5450
+    },
+    {
+      "epoch": 2.12,
+      "learning_rate": 3.939165549988873e-05,
+      "loss": 0.7674,
+      "step": 5475
+    },
+    {
+      "epoch": 2.13,
+      "learning_rate": 3.858632794171222e-05,
+      "loss": 0.7722,
+      "step": 5500
     }
   ],
   "max_steps": 7737,
   "num_train_epochs": 3,
-  "total_flos": 2.2394545727200035e+19,
+  "total_flos": 2.3687017848899633e+19,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/checkpoint-5500/training_args.bin b/checkpoint-5500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1
--- /dev/null
+++ b/checkpoint-5500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6
+size 4027
diff --git a/checkpoint-5200/README.md b/checkpoint-5600/README.md
similarity index 100%
rename from checkpoint-5200/README.md
rename to checkpoint-5600/README.md
diff --git a/checkpoint-5100/adapter_model/adapter_config.json b/checkpoint-5600/adapter_config.json
similarity index 94%
rename from checkpoint-5100/adapter_model/adapter_config.json
rename to checkpoint-5600/adapter_config.json
index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..5b3f45c250ff330299d2364a46de0623dadd2f48 100644
--- a/checkpoint-5100/adapter_model/adapter_config.json
+++ b/checkpoint-5600/adapter_config.json
@@ -14,13 +14,13 @@
   "r": 32,
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "up_proj",
-    "k_proj",
     "q_proj",
-    "down_proj",
     "gate_proj",
-    "o_proj"
+    "o_proj",
+    "down_proj",
+    "k_proj",
+    "v_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM"
 }
\ No newline at end of file
diff --git a/checkpoint-5600/adapter_model.bin b/checkpoint-5600/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..427abc5179a9c1573bde250175a84acdb13acb5a
--- /dev/null
+++ b/checkpoint-5600/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e96ff867e21cc9653b08a6604c2b9fee34b49567f39bc3b5219920c59a1ad479
+size 500897101
diff --git a/checkpoint-5200/adapter_model/README.md b/checkpoint-5600/adapter_model/README.md
similarity index 100%
rename from checkpoint-5200/adapter_model/README.md
rename to checkpoint-5600/adapter_model/README.md
diff --git a/checkpoint-5600/adapter_model/adapter_config.json b/checkpoint-5600/adapter_model/adapter_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..5b3f45c250ff330299d2364a46de0623dadd2f48
--- /dev/null
+++ b/checkpoint-5600/adapter_model/adapter_config.json
@@ -0,0 +1,26 @@
+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/workspace/webui/models/TheBloke_Llama-2-13B-fp16",
+  "bias": "none",
+  "fan_in_fan_out": null,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 16,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 32,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "gate_proj",
+    "o_proj",
+    "down_proj",
+    "k_proj",
+    "v_proj",
+    "up_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}
\ No newline at end of file
diff --git a/checkpoint-5600/adapter_model/adapter_model.bin b/checkpoint-5600/adapter_model/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..427abc5179a9c1573bde250175a84acdb13acb5a
--- /dev/null
+++ b/checkpoint-5600/adapter_model/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e96ff867e21cc9653b08a6604c2b9fee34b49567f39bc3b5219920c59a1ad479
+size 500897101
diff --git a/checkpoint-5600/optimizer.pt b/checkpoint-5600/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..e0fbdf4d0a53fbf8f9394431ee4fb0d3982604ec
--- /dev/null
+++ b/checkpoint-5600/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df47db77572b5903eee04a46dab5d058c91d6beb23a0c788c4e7a5ff96c06106
+size 1001752701
diff --git a/checkpoint-5600/rng_state_0.pth b/checkpoint-5600/rng_state_0.pth
new file mode 100644
index 0000000000000000000000000000000000000000..400f0b99223b4a2b6ff573b6179ecd47f631f0ab
--- /dev/null
+++ b/checkpoint-5600/rng_state_0.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2649527449cc7bab876f24864f3a04b696ce2041881461ec304e8e720f5c2731
+size 27772
diff --git a/checkpoint-5600/rng_state_1.pth b/checkpoint-5600/rng_state_1.pth
new file mode 100644
index 0000000000000000000000000000000000000000..2be91acf27fb464aec769cdf1ae4ca2e704c738a
--- /dev/null
+++ b/checkpoint-5600/rng_state_1.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae037bf942f3d5243bbe7c3db837eb84dcd51095ec0ba382f43a17d0c0c87f5b
+size 27772
diff --git a/checkpoint-5600/rng_state_10.pth b/checkpoint-5600/rng_state_10.pth
new file mode 100644
index 0000000000000000000000000000000000000000..e59ba6d28072b1c441e071b56698aac69fed5117
--- /dev/null
+++ b/checkpoint-5600/rng_state_10.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d09be680de783308c5b6c5c5c75f1cf1b7e91ec7dbf0ccc24e0e1adea4c8acd
+size 27789
diff --git a/checkpoint-5600/rng_state_11.pth b/checkpoint-5600/rng_state_11.pth
new file mode 100644
index 0000000000000000000000000000000000000000..9de92cb383dcef1347b179fe9b8d5ec38ee15c3e
--- /dev/null
+++ b/checkpoint-5600/rng_state_11.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72fe3e4408208255a5fc68fcce1f01d10c7f1eae3f2c7548666160ee70f0e6aa
+size 27789
diff --git a/checkpoint-5600/rng_state_12.pth b/checkpoint-5600/rng_state_12.pth
new file mode 100644
index 0000000000000000000000000000000000000000..1c5dfd7ae4a944d2633a0f570b01b0eb9cbda76e
--- /dev/null
+++ b/checkpoint-5600/rng_state_12.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0960c791386b2315bfdb5dc6eb00805451f82b5884e14fa0e8b5f9e824859ff
+size 27789
diff --git a/checkpoint-5600/rng_state_13.pth b/checkpoint-5600/rng_state_13.pth
new file mode 100644
index 0000000000000000000000000000000000000000..7691410b7970e8c4b5c94ebe8b13e01319206818
--- /dev/null
+++ b/checkpoint-5600/rng_state_13.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:732bbec507cf39b6e24310e2184b2d9b1837e907f6677563fd5c6f9891d7a8de
+size 27789
diff --git a/checkpoint-5600/rng_state_2.pth b/checkpoint-5600/rng_state_2.pth
new file mode 100644
index 0000000000000000000000000000000000000000..1d392ab1a2e830ddde436953957e80c79a7077ed
--- /dev/null
+++ b/checkpoint-5600/rng_state_2.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ce44f1432aaa2d64261a1f7fbc6a5482030d9f8a9fffc628a7cdebce9ee27a6
+size 27772
diff --git a/checkpoint-5600/rng_state_3.pth b/checkpoint-5600/rng_state_3.pth
new file mode 100644
index 0000000000000000000000000000000000000000..ead0be94ffa333db9e7905e81a8fa62d2bad5d69
--- /dev/null
+++ b/checkpoint-5600/rng_state_3.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c025a89c9d90fd82a35542e443baf062744f6456e92fe3bcf602fa5825c4f3e
+size 27772
diff --git a/checkpoint-5600/rng_state_4.pth b/checkpoint-5600/rng_state_4.pth
new file mode 100644
index 0000000000000000000000000000000000000000..78f05a6a3410eb5c9db1d7e3137a8e56044e95b9
--- /dev/null
+++ b/checkpoint-5600/rng_state_4.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a516cb688f1dc31792fb91446d23ded3a5796e4dc99dd525d9bac5f9dc529c35
+size 27772
diff --git a/checkpoint-5600/rng_state_5.pth b/checkpoint-5600/rng_state_5.pth
new file mode 100644
index 0000000000000000000000000000000000000000..76f3854f263fe2c261868a0160dd999cb2499026
--- /dev/null
+++ b/checkpoint-5600/rng_state_5.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f7823690621e69b2981b133b63eb5a80a23490616d48dc63cb760e86e38604a
+size 27772
diff --git a/checkpoint-5600/rng_state_6.pth b/checkpoint-5600/rng_state_6.pth
new file mode 100644
index 0000000000000000000000000000000000000000..9b5aaf73005a165301ae66b9dc4272d38c4ec85b
--- /dev/null
+++ b/checkpoint-5600/rng_state_6.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18df96fd55552e3861ed458fc798b0c3920f65c1ce37c6cc620c9e50505a7e09
+size 27772
diff --git a/checkpoint-5600/rng_state_7.pth b/checkpoint-5600/rng_state_7.pth
new file mode 100644
index 0000000000000000000000000000000000000000..19412ea18371d748e653a42aba6abeaedfa8bbc1
--- /dev/null
+++ b/checkpoint-5600/rng_state_7.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84f81d3438f9d778b8103678ab771741f7b2225c3019a7cfc2e9c229006c5413
+size 27772
diff --git a/checkpoint-5600/rng_state_8.pth b/checkpoint-5600/rng_state_8.pth
new file mode 100644
index 0000000000000000000000000000000000000000..83f0aaf0a98801f5e36eaaf7c376c438f1e7f02b
--- /dev/null
+++ b/checkpoint-5600/rng_state_8.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d5b70e93fcc996c03cc042b239463bcc53073b6d9ed06b24e1269d510cb89df
+size 27772
diff --git a/checkpoint-5600/rng_state_9.pth b/checkpoint-5600/rng_state_9.pth
new file mode 100644
index 0000000000000000000000000000000000000000..0b891a65ce49471ffa81bef6f5673197f206205c
--- /dev/null
+++ b/checkpoint-5600/rng_state_9.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a90f3084f765b30672ebf421b021b4022b5f3d36076be9073a91796e1a6089b1
+size 27772
diff --git a/checkpoint-5600/scheduler.pt b/checkpoint-5600/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..2cd78806480121e3ea9f28152ce36ad0e0f05faa
--- /dev/null
+++ b/checkpoint-5600/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b513b0465d40001c6314a5a4b4dc290c6baefd28e2877ca89d7e28757ae1791
+size 627
diff --git a/checkpoint-5100/trainer_state.json b/checkpoint-5600/trainer_state.json
similarity index 91%
rename from checkpoint-5100/trainer_state.json
rename to checkpoint-5600/trainer_state.json
index 31f9ead56164f53bb88ae75076a62bb58974bed0..0f4cbe52d86850b9d7cc6d7dd5bb106474d0cae3 100644
--- a/checkpoint-5100/trainer_state.json
+++ b/checkpoint-5600/trainer_state.json
@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.9775106630476929,
-  "global_step": 5100,
+  "epoch": 2.1713842574641333,
+  "global_step": 5600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1246,11 +1246,131 @@
       "learning_rate": 5.21748855202839e-05,
       "loss": 0.7868,
       "step": 5100
+    },
+    {
+      "epoch": 1.99,
+      "learning_rate": 5.128471597058342e-05,
+      "loss": 0.7993,
+      "step": 5125
+    },
+    {
+      "epoch": 2.0,
+      "learning_rate": 5.03995793340572e-05,
+      "loss": 0.7892,
+      "step": 5150
+    },
+    {
+      "epoch": 2.01,
+      "learning_rate": 4.9519567056663694e-05,
+      "loss": 0.7788,
+      "step": 5175
+    },
+    {
+      "epoch": 2.02,
+      "learning_rate": 4.864477005494938e-05,
+      "loss": 0.7654,
+      "step": 5200
+    },
+    {
+      "epoch": 2.03,
+      "learning_rate": 4.777527870665592e-05,
+      "loss": 0.7468,
+      "step": 5225
+    },
+    {
+      "epoch": 2.04,
+      "learning_rate": 4.691118284138296e-05,
+      "loss": 0.7359,
+      "step": 5250
+    },
+    {
+      "epoch": 2.05,
+      "learning_rate": 4.605257173130763e-05,
+      "loss": 0.7422,
+      "step": 5275
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.519953408196152e-05,
+      "loss": 0.7424,
+      "step": 5300
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.435215802306635e-05,
+      "loss": 0.7521,
+      "step": 5325
+    },
+    {
+      "epoch": 2.07,
+      "learning_rate": 4.351053109942894e-05,
+      "loss": 0.7477,
+      "step": 5350
+    },
+    {
+      "epoch": 2.08,
+      "learning_rate": 4.2674740261896776e-05,
+      "loss": 0.7456,
+      "step": 5375
+    },
+    {
+      "epoch": 2.09,
+      "learning_rate": 4.1844871858374844e-05,
+      "loss": 0.766,
+      "step": 5400
+    },
+    {
+      "epoch": 2.1,
+      "learning_rate": 4.1021011624904814e-05,
+      "loss": 0.7664,
+      "step": 5425
+    },
+    {
+      "epoch": 2.11,
+      "learning_rate": 4.0203244676807353e-05,
+      "loss": 0.7703,
+      "step": 5450
+    },
+    {
+      "epoch": 2.12,
+      "learning_rate": 3.939165549988873e-05,
+      "loss": 0.7674,
+      "step": 5475
+    },
+    {
+      "epoch": 2.13,
+      "learning_rate": 3.858632794171222e-05,
+      "loss": 0.7722,
+      "step": 5500
+    },
+    {
+      "epoch": 2.14,
+      "learning_rate": 3.778734520293562e-05,
+      "loss": 0.7716,
+      "step": 5525
+    },
+    {
+      "epoch": 2.15,
+      "learning_rate": 3.699478982871561e-05,
+      "loss": 0.7795,
+      "step": 5550
+    },
+    {
+      "epoch": 2.16,
+      "learning_rate": 3.62087437001797e-05,
+      "loss": 0.7728,
+      "step": 5575
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 3.5429288025966944e-05,
+      "loss": 0.7709,
+      "step": 5600
     }
   ],
   "max_steps": 7737,
   "num_train_epochs": 3,
-  "total_flos": 2.1963895120276226e+19,
+  "total_flos": 2.4117470741298938e+19,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/checkpoint-5600/training_args.bin b/checkpoint-5600/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1
--- /dev/null
+++ b/checkpoint-5600/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6
+size 4027
diff --git a/checkpoint-5300/README.md b/checkpoint-5700/README.md
similarity index 100%
rename from checkpoint-5300/README.md
rename to checkpoint-5700/README.md
diff --git a/checkpoint-5200/adapter_config.json b/checkpoint-5700/adapter_config.json
similarity index 94%
rename from checkpoint-5200/adapter_config.json
rename to checkpoint-5700/adapter_config.json
index 9562283fecc55d7524b16dcc7b9d9a5daf36f0df..7052646debaf453de93d6176727714122c31b64a 100644
--- a/checkpoint-5200/adapter_config.json
+++ b/checkpoint-5700/adapter_config.json
@@ -14,13 +14,13 @@
   "r": 32,
   "revision": null,
   "target_modules": [
+    "q_proj",
     "v_proj",
+    "gate_proj",
     "up_proj",
+    "o_proj",
     "k_proj",
-    "q_proj",
-    "down_proj",
-    "gate_proj",
-    "o_proj"
+    "down_proj"
   ],
   "task_type": "CAUSAL_LM"
 }
\ No newline at end of file
diff --git a/checkpoint-5700/adapter_model.bin b/checkpoint-5700/adapter_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..02526e93c7101a3c9d0727acfe024831696398f1
--- /dev/null
+++ b/checkpoint-5700/adapter_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95
+size 500897101
diff --git a/checkpoint-5700/optimizer.pt b/checkpoint-5700/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..8d3c8aee3e9ab00a5c3caededd68fa2b6406534b
--- /dev/null
+++ b/checkpoint-5700/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8847b7875d322ad5570a300587a0f3924a360ae4df3e2feeb97a8a2e21a3cbff
+size 1001752701
diff --git a/checkpoint-5700/rng_state_0.pth b/checkpoint-5700/rng_state_0.pth
new file mode 100644
index 0000000000000000000000000000000000000000..3c2a9137bfd1f9c3efd5228cb92aa36dc82cc29a
--- /dev/null
+++ b/checkpoint-5700/rng_state_0.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f06ce8fd6a33ec4407e0888bbcc8c7e40f4d820c9b7b7024f808c1cb08bac1f9
+size 27772
diff --git a/checkpoint-5700/rng_state_1.pth b/checkpoint-5700/rng_state_1.pth
new file mode 100644
index 0000000000000000000000000000000000000000..07bb8ba3171f9114ca378631f850b16a8ca02a83
--- /dev/null
+++ b/checkpoint-5700/rng_state_1.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:218ef7d643b85f18451d0ff4e11963ac2483f153fb71cc3ca1ab2bc1c0c67051
+size 27772
diff --git a/checkpoint-5700/rng_state_10.pth b/checkpoint-5700/rng_state_10.pth
new file mode 100644
index 0000000000000000000000000000000000000000..62f27578ae3c5f05071b9cf5c702eeb81bc6d415
--- /dev/null
+++ b/checkpoint-5700/rng_state_10.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d52fed50c25d75d7fa962b9f10f71f848700ff11f9305a37b16ca126fee5481
+size 27789
diff --git a/checkpoint-5700/rng_state_11.pth b/checkpoint-5700/rng_state_11.pth
new file mode 100644
index 0000000000000000000000000000000000000000..c2efdd8e880e555c19f213e77989c03985c1fd8a
--- /dev/null
+++ b/checkpoint-5700/rng_state_11.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca4cdcdc956f43b62d0d18dc1d662748eb79bf6714c90145fc90101a1ea2249d
+size 27789
diff --git a/checkpoint-5700/rng_state_12.pth b/checkpoint-5700/rng_state_12.pth
new file mode 100644
index 0000000000000000000000000000000000000000..35ffc9df08e4edd6abf3d1d242d2d90918445da0
--- /dev/null
+++ b/checkpoint-5700/rng_state_12.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8305db4caf39e6fd5e1f06f849d2a6d65681cf5c367dd8a754a886f1d32d4456
+size 27789
diff --git a/checkpoint-5700/rng_state_13.pth b/checkpoint-5700/rng_state_13.pth
new file mode 100644
index 0000000000000000000000000000000000000000..9951d89ea973b30e68cd7319d1009ce908729213
--- /dev/null
+++ b/checkpoint-5700/rng_state_13.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd9d3dc3cf0abd594c579dd75cbe79170df6d02cec6c38d47e042b3dd26300d9
+size 27789
diff --git a/checkpoint-5700/rng_state_2.pth b/checkpoint-5700/rng_state_2.pth
new file mode 100644
index 0000000000000000000000000000000000000000..8d36198d13637177c88509187eec27963707dbc4
--- /dev/null
+++ b/checkpoint-5700/rng_state_2.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:348612a8cf3a488b2de324430f631e10c4e8156112e6c50cecda44157e829595
+size 27772
diff --git a/checkpoint-5700/rng_state_3.pth b/checkpoint-5700/rng_state_3.pth
new file mode 100644
index 0000000000000000000000000000000000000000..8f72210cf61d845505e06c0f681a11f782d2d543
--- /dev/null
+++ b/checkpoint-5700/rng_state_3.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c688a5f058c380a72ea06519f8b004106c3bf62f4ac8ae5b0e96c473dbac963c
+size 27772
diff --git a/checkpoint-5700/rng_state_4.pth b/checkpoint-5700/rng_state_4.pth
new file mode 100644
index 0000000000000000000000000000000000000000..062d0bace80c1db35317fbd29fd2698c02cb8cd8
--- /dev/null
+++ b/checkpoint-5700/rng_state_4.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:20ebd3abf1496a95cb8a1cc494c974137f7880bb1069b7813817b8600444464d
+size 27772
diff --git a/checkpoint-5700/rng_state_5.pth b/checkpoint-5700/rng_state_5.pth
new file mode 100644
index 0000000000000000000000000000000000000000..337c9b58db07231bee27e8d458d57f2f970e7da4
--- /dev/null
+++ b/checkpoint-5700/rng_state_5.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0ad3339005efdbfae3bb272ea3ce0907371f54b4834a96fa9c864807063f63d
+size 27772
diff --git a/checkpoint-5700/rng_state_6.pth b/checkpoint-5700/rng_state_6.pth
new file mode 100644
index 0000000000000000000000000000000000000000..b6b7bdf4e47fc358d7c2daa8c1e04e4eae152289
--- /dev/null
+++ b/checkpoint-5700/rng_state_6.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f13556a5091d1d8f3874fe4a97ac3fc222b586812ceab6167e99bc25dc28fc0
+size 27772
diff --git a/checkpoint-5700/rng_state_7.pth b/checkpoint-5700/rng_state_7.pth
new file mode 100644
index 0000000000000000000000000000000000000000..c2beb3e1bd8f4fe6a018c96e8cc80233ad1384b9
--- /dev/null
+++ b/checkpoint-5700/rng_state_7.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b76a223c2ea9e5262b69fc056b9f29e0dd62a728f58a99ac77374aeb72fce68
+size 27772
diff --git a/checkpoint-5700/rng_state_8.pth b/checkpoint-5700/rng_state_8.pth
new file mode 100644
index 0000000000000000000000000000000000000000..73e55c77fc49eb5929193d73402cd3d20c1f563e
--- /dev/null
+++ b/checkpoint-5700/rng_state_8.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae0f14b82c516564368a80f0d993ef826bf389434bdd326ac982efc3e52dc286
+size 27772
diff --git a/checkpoint-5700/rng_state_9.pth b/checkpoint-5700/rng_state_9.pth
new file mode 100644
index 0000000000000000000000000000000000000000..c7da4b43531a42c31650b4c283559a7d8f311a95
--- /dev/null
+++ b/checkpoint-5700/rng_state_9.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff589c2de9aa0e8b005f5e548e65245c51b773411b16d01c505e9d491673af3f
+size 27772
diff --git a/checkpoint-5700/scheduler.pt b/checkpoint-5700/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..7e36ca6a96764eeccb6aa7d9c5028585fed23370
--- /dev/null
+++ b/checkpoint-5700/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:935f0139e1e2ffb90e75a6a1904fe50b37854f0d00a6d9b7dc07c85fc7a0d97c
+size 627
diff --git a/checkpoint-5000/trainer_state.json b/checkpoint-5700/trainer_state.json
similarity index 87%
rename from checkpoint-5000/trainer_state.json
rename to checkpoint-5700/trainer_state.json
index af780eb13311ced739f9badd8713c039b76bfa10..8c4091dad201566e2ffa5b495ce638f306686a5e 100644
--- a/checkpoint-5000/trainer_state.json
+++ b/checkpoint-5700/trainer_state.json
@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.9387359441644048,
-  "global_step": 5000,
+  "epoch": 2.2101589763474214,
+  "global_step": 5700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1222,11 +1222,179 @@
       "eval_samples_per_second": 12.251,
       "eval_steps_per_second": 0.889,
       "step": 5000
+    },
+    {
+      "epoch": 1.95,
+      "learning_rate": 5.487466944644033e-05,
+      "loss": 0.7902,
+      "step": 5025
+    },
+    {
+      "epoch": 1.96,
+      "learning_rate": 5.3969954985052996e-05,
+      "loss": 0.7979,
+      "step": 5050
+    },
+    {
+      "epoch": 1.97,
+      "learning_rate": 5.306999601723579e-05,
+      "loss": 0.7931,
+      "step": 5075
+    },
+    {
+      "epoch": 1.98,
+      "learning_rate": 5.21748855202839e-05,
+      "loss": 0.7868,
+      "step": 5100
+    },
+    {
+      "epoch": 1.99,
+      "learning_rate": 5.128471597058342e-05,
+      "loss": 0.7993,
+      "step": 5125
+    },
+    {
+      "epoch": 2.0,
+      "learning_rate": 5.03995793340572e-05,
+      "loss": 0.7892,
+      "step": 5150
+    },
+    {
+      "epoch": 2.01,
+      "learning_rate": 4.9519567056663694e-05,
+      "loss": 0.7788,
+      "step": 5175
+    },
+    {
+      "epoch": 2.02,
+      "learning_rate": 4.864477005494938e-05,
+      "loss": 0.7654,
+      "step": 5200
+    },
+    {
+      "epoch": 2.03,
+      "learning_rate": 4.777527870665592e-05,
+      "loss": 0.7468,
+      "step": 5225
+    },
+    {
+      "epoch": 2.04,
+      "learning_rate": 4.691118284138296e-05,
+      "loss": 0.7359,
+      "step": 5250
+    },
+    {
+      "epoch": 2.05,
+      "learning_rate": 4.605257173130763e-05,
+      "loss": 0.7422,
+      "step": 5275
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.519953408196152e-05,
+      "loss": 0.7424,
+      "step": 5300
+    },
+    {
+      "epoch": 2.06,
+      "learning_rate": 4.435215802306635e-05,
+      "loss": 0.7521,
+      "step": 5325
+    },
+    {
+      "epoch": 2.07,
+      "learning_rate": 4.351053109942894e-05,
+      "loss": 0.7477,
+      "step": 5350
+    },
+    {
+      "epoch": 2.08,
+      "learning_rate": 4.2674740261896776e-05,
+      "loss": 0.7456,
+      "step": 5375
+    },
+    {
+      "epoch": 2.09,
+      "learning_rate": 4.1844871858374844e-05,
+      "loss": 0.766,
+      "step": 5400
+    },
+    {
+      "epoch": 2.1,
+      "learning_rate": 4.1021011624904814e-05,
+      "loss": 0.7664,
+      "step": 5425
+    },
+    {
+      "epoch": 2.11,
+      "learning_rate": 4.0203244676807353e-05,
+      "loss": 0.7703,
+      "step": 5450
+    },
+    {
+      "epoch": 2.12,
+      "learning_rate": 3.939165549988873e-05,
+      "loss": 0.7674,
+      "step": 5475
+    },
+    {
+      "epoch": 2.13,
+      "learning_rate": 3.858632794171222e-05,
+      "loss": 0.7722,
+      "step": 5500
+    },
+    {
+      "epoch": 2.14,
+      "learning_rate": 3.778734520293562e-05,
+      "loss": 0.7716,
+      "step": 5525
+    },
+    {
+      "epoch": 2.15,
+      "learning_rate": 3.699478982871561e-05,
+      "loss": 0.7795,
+      "step": 5550
+    },
+    {
+      "epoch": 2.16,
+      "learning_rate": 3.62087437001797e-05,
+      "loss": 0.7728,
+      "step": 5575
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 3.5429288025966944e-05,
+      "loss": 0.7709,
+      "step": 5600
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 3.4656503333837956e-05,
+      "loss": 0.7682,
+      "step": 5625
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 3.389046946235542e-05,
+      "loss": 0.7734,
+      "step": 5650
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 3.313126555263576e-05,
+      "loss": 0.7716,
+      "step": 5675
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 3.237897004017276e-05,
+      "loss": 0.7716,
+      "step": 5700
     }
   ],
   "max_steps": 7737,
   "num_train_epochs": 3,
-  "total_flos": 2.1532695573582316e+19,
+  "total_flos": 2.4549667828507083e+19,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/checkpoint-5700/training_args.bin b/checkpoint-5700/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c456116f688fe6cb6deecb1e0a1cf8d153d349fb
--- /dev/null
+++ b/checkpoint-5700/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2
+size 4027
diff --git a/training_args.bin b/training_args.bin
index ed2c87b3546aa7b8ec35fe3fa8e1331e669a72a1..c456116f688fe6cb6deecb1e0a1cf8d153d349fb 100644
--- a/training_args.bin
+++ b/training_args.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:689d52379bcc7c50e04c40b22a97b473b8de3f17b4096bebf81eb9f37e1dafa6
+oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2
 size 4027