trapoom555 committed
Commit e287de6 (1 parent: cf66735)

delete optimizer state

This view is limited to 50 files because the commit contains too many changes; see the raw diff for the full change set.
Files changed (50)
  1. .DS_Store +0 -0
  2. checkpoint-10/optimizer.pt +0 -3
  3. checkpoint-10/rng_state_0.pth +0 -3
  4. checkpoint-10/rng_state_1.pth +0 -3
  5. checkpoint-10/rng_state_2.pth +0 -3
  6. checkpoint-10/rng_state_3.pth +0 -3
  7. checkpoint-10/scheduler.pt +0 -3
  8. checkpoint-10/trainer_state.json +0 -28
  9. checkpoint-100/optimizer.pt +0 -3
  10. checkpoint-100/rng_state_0.pth +0 -3
  11. checkpoint-100/rng_state_1.pth +0 -3
  12. checkpoint-100/rng_state_2.pth +0 -3
  13. checkpoint-100/rng_state_3.pth +0 -3
  14. checkpoint-100/scheduler.pt +0 -3
  15. checkpoint-100/trainer_state.json +0 -91
  16. checkpoint-110/optimizer.pt +0 -3
  17. checkpoint-110/rng_state_0.pth +0 -3
  18. checkpoint-110/rng_state_1.pth +0 -3
  19. checkpoint-110/rng_state_2.pth +0 -3
  20. checkpoint-110/rng_state_3.pth +0 -3
  21. checkpoint-110/scheduler.pt +0 -3
  22. checkpoint-110/trainer_state.json +0 -98
  23. checkpoint-120/optimizer.pt +0 -3
  24. checkpoint-120/rng_state_0.pth +0 -3
  25. checkpoint-120/rng_state_1.pth +0 -3
  26. checkpoint-120/rng_state_2.pth +0 -3
  27. checkpoint-120/rng_state_3.pth +0 -3
  28. checkpoint-120/scheduler.pt +0 -3
  29. checkpoint-120/trainer_state.json +0 -105
  30. checkpoint-130/optimizer.pt +0 -3
  31. checkpoint-130/rng_state_0.pth +0 -3
  32. checkpoint-130/rng_state_1.pth +0 -3
  33. checkpoint-130/rng_state_2.pth +0 -3
  34. checkpoint-130/rng_state_3.pth +0 -3
  35. checkpoint-130/scheduler.pt +0 -3
  36. checkpoint-130/trainer_state.json +0 -112
  37. checkpoint-140/optimizer.pt +0 -3
  38. checkpoint-140/rng_state_0.pth +0 -3
  39. checkpoint-140/rng_state_1.pth +0 -3
  40. checkpoint-140/rng_state_2.pth +0 -3
  41. checkpoint-140/rng_state_3.pth +0 -3
  42. checkpoint-140/scheduler.pt +0 -3
  43. checkpoint-140/trainer_state.json +0 -119
  44. checkpoint-150/optimizer.pt +0 -3
  45. checkpoint-150/rng_state_0.pth +0 -3
  46. checkpoint-150/rng_state_1.pth +0 -3
  47. checkpoint-150/rng_state_2.pth +0 -3
  48. checkpoint-150/rng_state_3.pth +0 -3
  49. checkpoint-150/scheduler.pt +0 -3
  50. checkpoint-150/trainer_state.json +0 -126
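
This commit strips the Hugging Face Trainer's resumption state (optimizer.pt, scheduler.pt, the per-process rng_state_*.pth files, and trainer_state.json) from every checkpoint-N directory, leaving only the model weights in the repository. A minimal local cleanup sketch that would produce the same set of deletions is shown below; it is not part of the commit, and the file layout is assumed from the listing above.

# Hypothetical cleanup script (assumption: checkpoints live in checkpoint-*/
# directories containing the file names listed above).
from pathlib import Path

STATE_FILES = ("optimizer.pt", "scheduler.pt", "trainer_state.json")

def prune_checkpoint_state(repo_root: str = ".") -> None:
    for ckpt_dir in sorted(Path(repo_root).glob("checkpoint-*")):
        # Remove the fixed-name Trainer state files.
        for name in STATE_FILES:
            target = ckpt_dir / name
            if target.exists():
                target.unlink()
        # Remove one RNG state file per training process (rng_state_0.pth, ...).
        for rng_file in ckpt_dir.glob("rng_state_*.pth"):
            rng_file.unlink()

if __name__ == "__main__":
    prune_checkpoint_state()
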
.DS_Store ADDED
Binary file (6.15 kB)
 
checkpoint-10/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:1aef16bd447fb0d9ab7ea589a7a66dfdef7306cdb918a22458512ff587b68a64
- size 11930938

checkpoint-10/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:279c231f7db5849b53ea6f61278709c8be27bcc46fc1b36100377bf36c55cfb9
- size 15024

checkpoint-10/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:35738ebb9e53709608b7f4feaf1edbde1a19901d813f15922153ded80ead6540
- size 15024

checkpoint-10/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:3f411b8c60d90c0733bb03c4955ea2e40ab35464f214cb47cc4d6d0eaa83bc79
- size 15024

checkpoint-10/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:7224ff493b87486a3e2c3001115ad539913e8fe95cf25f4bcae3236f97e83f41
- size 15024

checkpoint-10/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:132a4d8a2402b42567b2e1dc1c6a48bad549652509953ce872ad2e01b1912ad5
- size 1064

checkpoint-10/trainer_state.json DELETED
@@ -1,28 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.0007256367462448298,
- "eval_steps": 500,
- "global_step": 10,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

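Each deleted trainer_state.json carries the run's bookkeeping: a handful of scalar fields (global_step, save/logging intervals, batch size) plus a log_history list with the loss, learning rate, and gradient norm recorded every logging_steps. A minimal sketch, assuming only the JSON layout visible in the diff above, of how a loss curve could be pulled out of such a file before it is deleted:

import json
from pathlib import Path

def load_loss_curve(trainer_state_path: str) -> list[tuple[int, float]]:
    """Return (step, loss) pairs from a Trainer trainer_state.json."""
    state = json.loads(Path(trainer_state_path).read_text())
    return [(entry["step"], entry["loss"])
            for entry in state["log_history"]
            if "loss" in entry]

# For the checkpoint-10 file shown above this would yield [(10, 2.3531)].
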
checkpoint-100/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:9381ae68692ba2b7341ae855c90812a5fbafbc8e14556f3ac4dbaad16be047d4
- size 11930938

checkpoint-100/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:85f43e42ff30186bb51f3d90dcd7d261d6e09960636961fd696f9478303d1331
- size 15024

checkpoint-100/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:daf210db9013b20416569b6811b878570fbbf461f867de41a8a69fd07f0d2c8c
- size 15024

checkpoint-100/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:132e0dad8f05cba3da38386b81951c801df7c5c2c1cf9e06b5d359b7b92422da
- size 15024

checkpoint-100/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:441e2aab46e3935d5d49029fda3ebaf07053ac3a8e8a6eb7aca038ab1127bea1
- size 15024

checkpoint-100/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:19f5d0bbf212c73b040975411809641839aa3caa43c4a2c866ebc22031333594
- size 1064

checkpoint-100/trainer_state.json DELETED
@@ -1,91 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.007256367462448298,
- "eval_steps": 500,
- "global_step": 100,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

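The log_history above shows the learning rate climbing by 5e-4 every 10 steps, from 0.0005 at step 10 to 0.005 at step 100, and the later checkpoints show it decaying only marginally, which is consistent with a roughly 100-step warmup toward a 5e-3 peak over the run's 13,781 max steps, with a per-device batch size of 5 and a checkpoint saved every 10 steps. A speculative TrainingArguments sketch consistent with those logged values follows; the actual training script is not part of this commit, and the scheduler type and warmup length are guesses.

# Speculative reconstruction inferred only from trainer_state.json values;
# not the author's actual configuration.
from transformers import TrainingArguments

args = TrainingArguments(
    output_dir="checkpoints",        # assumed; checkpoints appear as checkpoint-<step>
    per_device_train_batch_size=5,   # "train_batch_size": 5
    num_train_epochs=1,              # "num_train_epochs": 1
    learning_rate=5e-3,              # peak value reached at step 100
    warmup_steps=100,                # guess from the linear ramp up to step 100
    lr_scheduler_type="cosine",      # guess from the slow decay after step 100
    logging_steps=10,                # "logging_steps": 10
    save_steps=10,                   # "save_steps": 10
)
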
checkpoint-110/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:71f7bccb601f5f4e4763183e247a17255e58030897d43de1d0aeceda220c00d0
- size 11930938

checkpoint-110/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:ac95db18ae6a1e414f19563e15335ec1a3d44d5b26a3896a591a42bf53daac57
- size 15024

checkpoint-110/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:9ad2adf8c9d84012d5c08bc34b7d7b7bd8f571238b97deba7b563bc8579f284e
- size 15024

checkpoint-110/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:d02fc29e95ce367f0b8273bbbf6e41186c317282c9a486968d768ffcb716f8dd
- size 15024

checkpoint-110/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:540b9cf222feb8019c875aee3fd37ce5b892ea395b93ddd0b75459462687e321
- size 15024

checkpoint-110/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:d11c04331c4b18b97e6fd3b7cb5a000c7ab23c225c4db79a1ee75e81b9696471
- size 1064

checkpoint-110/trainer_state.json DELETED
@@ -1,98 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.007982004208693128,
- "eval_steps": 500,
- "global_step": 110,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- },
- {
- "epoch": 0.007982004208693128,
- "grad_norm": 4.8125,
- "learning_rate": 0.00499999340865746,
- "loss": 0.6463,
- "step": 110
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

checkpoint-120/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:eab12cdf8889aad166eb799741b5090d64aef98d1cf4e9180e44a52269265bca
- size 11930938

checkpoint-120/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:e010d5c5e5ff459e09cee093e035058bce80bd0e562b9008cf49e37a37c4a265
- size 15024

checkpoint-120/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:8ceaec8c84867fda1405ca685c206ff5498d51b755970edb435f4777d1649c24
- size 15024

checkpoint-120/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:791eebd4302125380e3da4e87668a4bb1db8af54a2e9f9519cb225a5eefb78b6
- size 15024

checkpoint-120/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:7b5e8577ac55da749e71c292571c66ba7068eaeeac8f69a2d9ecb004c4ea24df
- size 15024

checkpoint-120/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:ff6b053b58138104c7022211d92f7de7c9f99a3edfbe310bf788eced5771619e
- size 1064

checkpoint-120/trainer_state.json DELETED
@@ -1,105 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.008707640954937958,
- "eval_steps": 500,
- "global_step": 120,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- },
- {
- "epoch": 0.007982004208693128,
- "grad_norm": 4.8125,
- "learning_rate": 0.00499999340865746,
- "loss": 0.6463,
- "step": 110
- },
- {
- "epoch": 0.008707640954937958,
- "grad_norm": 13.9375,
- "learning_rate": 0.004999973634664594,
- "loss": 0.8034,
- "step": 120
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

checkpoint-130/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:da0f042da58b28662f4d868e48004ee48f5f84292a362709bc1991944d6436e9
- size 11930938

checkpoint-130/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:7ced0c6ba13f477a0dbd44034592fe000f226e71898cbab5bf87ce59dc6bde36
- size 15024

checkpoint-130/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:e97d793be909b79220b59b211d87fda9d35184d2305c00641e9b4531b73b8441
- size 15024

checkpoint-130/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:60416c656b12aaecd01e32e964532f371c0a6b02a4b9b91ccfdc35d45dce0050
- size 15024

checkpoint-130/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:218ddffb5978f25094e6ad3cfbfc85ad7b807a183e3bc9f6f15bd471542d7273
- size 15024

checkpoint-130/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:7a7e64623a110e28d04bb4716eebddb4a4312d0694ae043b9f61172fbeab0c03
- size 1064

checkpoint-130/trainer_state.json DELETED
@@ -1,112 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.009433277701182788,
- "eval_steps": 500,
- "global_step": 130,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- },
- {
- "epoch": 0.007982004208693128,
- "grad_norm": 4.8125,
- "learning_rate": 0.00499999340865746,
- "loss": 0.6463,
- "step": 110
- },
- {
- "epoch": 0.008707640954937958,
- "grad_norm": 13.9375,
- "learning_rate": 0.004999973634664594,
- "loss": 0.8034,
- "step": 120
- },
- {
- "epoch": 0.009433277701182788,
- "grad_norm": 4.71875,
- "learning_rate": 0.004999940678125673,
- "loss": 0.9929,
- "step": 130
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

checkpoint-140/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:f515cbf176e5a7beb082e5a29035fa3c505d65ee772ea9b8701a482868425672
- size 11930938

checkpoint-140/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:6ad67dbef2a21b26f3117ca45d621957bf72b1116535cf6e524b17661b94b1a9
- size 15024

checkpoint-140/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:ca3afd4f067268e4c6ff34242266c9e70bce106dd4d7365781bb893119a4033d
- size 15024

checkpoint-140/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:f7a56e9bc058e763d68d477e80d923c2fe559a75d518ac8d5d693397a88304b3
- size 15024

checkpoint-140/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:8aef494a54b19f2a6c92fb251d8acadbfc7c21bcba926f5a7f5fa134981bb678
- size 15024

checkpoint-140/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:08ad8017df34c80a966f2de030fef490dd964b53e9d7026af7b314d0fb2202de
- size 1064

checkpoint-140/trainer_state.json DELETED
@@ -1,119 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.010158914447427617,
- "eval_steps": 500,
- "global_step": 140,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- },
- {
- "epoch": 0.007982004208693128,
- "grad_norm": 4.8125,
- "learning_rate": 0.00499999340865746,
- "loss": 0.6463,
- "step": 110
- },
- {
- "epoch": 0.008707640954937958,
- "grad_norm": 13.9375,
- "learning_rate": 0.004999973634664594,
- "loss": 0.8034,
- "step": 120
- },
- {
- "epoch": 0.009433277701182788,
- "grad_norm": 4.71875,
- "learning_rate": 0.004999940678125673,
- "loss": 0.9929,
- "step": 130
- },
- {
- "epoch": 0.010158914447427617,
- "grad_norm": 6.375,
- "learning_rate": 0.00499989453921448,
- "loss": 0.8968,
- "step": 140
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }

checkpoint-150/optimizer.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:79595e55006cb0b15a70ea23b98850bf2405eceaab7b27197afb23e09f2a0be8
- size 11930938

checkpoint-150/rng_state_0.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:c342af2ce35811f7314d04dcf27fe047ef7a2c2c65a53827cf5bfa3bbef9abbb
- size 15024

checkpoint-150/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:732cda9265841aab840d0742ab54e81d4890cc436da4ad72a7491a2de6e456cd
- size 15024

checkpoint-150/rng_state_2.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:b9e93aaf91c3d45dc0a00b2862a0b23147bc87200884e67202507624081ba206
- size 15024

checkpoint-150/rng_state_3.pth DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:bde38e9c7ebd4dcc6310f8e51cdb47e2f01b8ae902f2ef5613c6f4a36b2b5231
- size 15024

checkpoint-150/scheduler.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:9524decd0642f99483e902dfa82e4538a022415cedbf6a5f6e945ab4e631653e
- size 1064

checkpoint-150/trainer_state.json DELETED
@@ -1,126 +0,0 @@
- {
- "best_metric": null,
- "best_model_checkpoint": null,
- "epoch": 0.010884551193672447,
- "eval_steps": 500,
- "global_step": 150,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 0.0007256367462448298,
- "grad_norm": 7.3125,
- "learning_rate": 0.0005,
- "loss": 2.3531,
- "step": 10
- },
- {
- "epoch": 0.0014512734924896596,
- "grad_norm": 2.171875,
- "learning_rate": 0.001,
- "loss": 0.6359,
- "step": 20
- },
- {
- "epoch": 0.0021769102387344894,
- "grad_norm": 3.46875,
- "learning_rate": 0.0015,
- "loss": 0.4216,
- "step": 30
- },
- {
- "epoch": 0.0029025469849793192,
- "grad_norm": 2.75,
- "learning_rate": 0.002,
- "loss": 0.2925,
- "step": 40
- },
- {
- "epoch": 0.003628183731224149,
- "grad_norm": 2.5,
- "learning_rate": 0.0025,
- "loss": 0.5181,
- "step": 50
- },
- {
- "epoch": 0.004353820477468979,
- "grad_norm": 3.890625,
- "learning_rate": 0.003,
- "loss": 0.3559,
- "step": 60
- },
- {
- "epoch": 0.005079457223713809,
- "grad_norm": 2.453125,
- "learning_rate": 0.0034999999999999996,
- "loss": 0.3521,
- "step": 70
- },
- {
- "epoch": 0.0058050939699586385,
- "grad_norm": 2.921875,
- "learning_rate": 0.004,
- "loss": 0.6553,
- "step": 80
- },
- {
- "epoch": 0.006530730716203468,
- "grad_norm": 5.78125,
- "learning_rate": 0.0045000000000000005,
- "loss": 0.5693,
- "step": 90
- },
- {
- "epoch": 0.007256367462448298,
- "grad_norm": 3.9375,
- "learning_rate": 0.005,
- "loss": 0.4836,
- "step": 100
- },
- {
- "epoch": 0.007982004208693128,
- "grad_norm": 4.8125,
- "learning_rate": 0.00499999340865746,
- "loss": 0.6463,
- "step": 110
- },
- {
- "epoch": 0.008707640954937958,
- "grad_norm": 13.9375,
- "learning_rate": 0.004999973634664594,
- "loss": 0.8034,
- "step": 120
- },
- {
- "epoch": 0.009433277701182788,
- "grad_norm": 4.71875,
- "learning_rate": 0.004999940678125673,
- "loss": 0.9929,
- "step": 130
- },
- {
- "epoch": 0.010158914447427617,
- "grad_norm": 6.375,
- "learning_rate": 0.00499989453921448,
- "loss": 0.8968,
- "step": 140
- },
- {
- "epoch": 0.010884551193672447,
- "grad_norm": 1.984375,
- "learning_rate": 0.004999835218174307,
- "loss": 3.9939,
- "step": 150
- }
- ],
- "logging_steps": 10,
- "max_steps": 13781,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 1,
- "save_steps": 10,
- "total_flos": 0.0,
- "train_batch_size": 5,
- "trial_name": null,
- "trial_params": null
- }