Training in progress, epoch 1

Browse files

Files changed (15) hide show

model.safetensors +1 -1
run-1/checkpoint-214/model.safetensors +1 -1
run-1/checkpoint-214/optimizer.pt +1 -1
run-1/checkpoint-214/rng_state.pth +2 -2
run-1/checkpoint-214/scheduler.pt +1 -1
run-1/checkpoint-214/trainer_state.json +11 -11
run-1/checkpoint-214/training_args.bin +1 -1
run-1/checkpoint-428/model.safetensors +1 -1
run-1/checkpoint-428/optimizer.pt +1 -1
run-1/checkpoint-428/rng_state.pth +2 -2
run-1/checkpoint-428/scheduler.pt +1 -1
run-1/checkpoint-428/trainer_state.json +16 -16
run-1/checkpoint-428/training_args.bin +1 -1
runs/Feb28_19-52-39_5620ed9b2fff/events.out.tfevents.1709150660.5620ed9b2fff.209.20 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d93c6bad4aa755b790eb06670d6a1acc1ef67e4d1526c32025acd725542e891
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f18ca5f2049d94fea824128466a0f1820c99900e714cb7783890e8716c29379
 size 267832560

run-1/checkpoint-214/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c045372f29e6a3f37f3f88e140fc38258f54572ecc9ac94f101c483b9cc8c37a
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f18ca5f2049d94fea824128466a0f1820c99900e714cb7783890e8716c29379
 size 267832560

run-1/checkpoint-214/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:baf19709a4bde0c92be57853da99de5c712e40d25f9b8432966f9f3fcc825b31
 size 535727290

 version https://git-lfs.github.com/spec/v1
+oid sha256:3895d006c65cbdefae8e8f45e0a22ff7e61df8b1c088aefaacd886f5064f33f6
 size 535727290

run-1/checkpoint-214/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:027b5232182ab9d7d3bc920386e3c0b3dbe31bc099095d7c97caf72c228cf9c3
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:0652a30494a7551b8120ac6e0902e8c5305fecb27d67d6132c2fc2ce1b8b74e4
+size 14308

run-1/checkpoint-214/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b8745fd222b32e92bd39e730ff84b1164d52c90bc9b5fe05042532ceb0f6c1f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:96e921269274966d3249d7aa3e72de0a66b834a9db0861a1b99aa2a5e02d6d39
 size 1064

run-1/checkpoint-214/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.18118799119487816,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-214",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,26 +10,26 @@
   "log_history": [
     {
       "epoch": 1.0,
-      "eval_loss": 0.6478912234306335,
-      "eval_matthews_correlation": 0.18118799119487816,
-      "eval_runtime": 0.7571,
-      "eval_samples_per_second": 1377.58,
-      "eval_steps_per_second": 87.172,
       "step": 214
     }
   ],
   "logging_steps": 500,
-  "max_steps": 428,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 2,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
-    "learning_rate": 3.45845102664945e-05,
-    "num_train_epochs": 2,
     "per_device_train_batch_size": 4,
-    "seed": 15
   }
 }

 {
+  "best_metric": 0.0835915715371112,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-214",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 1.0,
+      "eval_loss": 0.5719716548919678,
+      "eval_matthews_correlation": 0.0835915715371112,
+      "eval_runtime": 0.6978,
+      "eval_samples_per_second": 1494.771,
+      "eval_steps_per_second": 94.588,
       "step": 214
     }
   ],
   "logging_steps": 500,
+  "max_steps": 642,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
+    "learning_rate": 3.5027277138406044e-05,
+    "num_train_epochs": 3,
     "per_device_train_batch_size": 4,
+    "seed": 29
   }
 }

run-1/checkpoint-214/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f8bfed4abe7904aebfa29146a26419ad532e218a199dc08365bb4ca5a35eafdb
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:824c97682d0b5180a58b29aad975f1f670351c62a61736d4bcfd4286ecc497ee
 size 4984

run-1/checkpoint-428/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8220f206622c6f496381eba1d07bd6ca75d91e74d50afa7e44799ad9c5be7d7d
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:913401d5bbd4d440e84f64d35aadb464db9f13b4cfa4e271b4f24bb732f105eb
 size 267832560

run-1/checkpoint-428/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e02fdb1e8930d0fc3489386465b2180991e69247221cc87c1151b1dbd15512a
 size 535727290

 version https://git-lfs.github.com/spec/v1
+oid sha256:624048ea325833af4406b91a77aff9ea3a950e331a071f74b3e4f6b95cfcf247
 size 535727290

run-1/checkpoint-428/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e87fe3c36d691ac6c42bca874c74ed014eefdbb6108564f8658fb9e5b9febc83
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:867e6927868191a86d6db7d56005075d31f36d251a9b673c6fbf57cd16a9a13b
+size 14308

run-1/checkpoint-428/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c25e2e9cf1ce0cd951d12d306061617bdab3f567ca512f75957cae4f113da48
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:55c9e244759cfc5447e2d2baa3725a9d460f6bb44cd1fbe697b437b2cb21c49a
 size 1064

run-1/checkpoint-428/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.3005246361638528,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
   "epoch": 2.0,
   "eval_steps": 500,
@@ -10,35 +10,35 @@
   "log_history": [
     {
       "epoch": 1.0,
-      "eval_loss": 0.6478912234306335,
-      "eval_matthews_correlation": 0.18118799119487816,
-      "eval_runtime": 0.7571,
-      "eval_samples_per_second": 1377.58,
-      "eval_steps_per_second": 87.172,
       "step": 214
     },
     {
       "epoch": 2.0,
-      "eval_loss": 0.9094101190567017,
-      "eval_matthews_correlation": 0.3005246361638528,
-      "eval_runtime": 1.0485,
-      "eval_samples_per_second": 994.768,
-      "eval_steps_per_second": 62.948,
       "step": 428
     }
   ],
   "logging_steps": 500,
-  "max_steps": 428,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 2,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
-    "learning_rate": 3.45845102664945e-05,
-    "num_train_epochs": 2,
     "per_device_train_batch_size": 4,
-    "seed": 15
   }
 }

 {
+  "best_metric": 0.3019091863081111,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
   "epoch": 2.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 1.0,
+      "eval_loss": 0.5719716548919678,
+      "eval_matthews_correlation": 0.0835915715371112,
+      "eval_runtime": 0.6978,
+      "eval_samples_per_second": 1494.771,
+      "eval_steps_per_second": 94.588,
       "step": 214
     },
     {
       "epoch": 2.0,
+      "eval_loss": 1.0430289506912231,
+      "eval_matthews_correlation": 0.3019091863081111,
+      "eval_runtime": 0.7554,
+      "eval_samples_per_second": 1380.773,
+      "eval_steps_per_second": 87.374,
       "step": 428
     }
   ],
   "logging_steps": 500,
+  "max_steps": 642,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
+    "learning_rate": 3.5027277138406044e-05,
+    "num_train_epochs": 3,
     "per_device_train_batch_size": 4,
+    "seed": 29
   }
 }

run-1/checkpoint-428/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f8bfed4abe7904aebfa29146a26419ad532e218a199dc08365bb4ca5a35eafdb
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:824c97682d0b5180a58b29aad975f1f670351c62a61736d4bcfd4286ecc497ee
 size 4984

runs/Feb28_19-52-39_5620ed9b2fff/events.out.tfevents.1709150660.5620ed9b2fff.209.20 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95a3c369dad2af8305d3091c29b46840702809cd76412bb48f4838eb06fee7fa
+size 6112

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f6d1731c3abac75809f54a97ff9d481250d1b24fb289e39c839a834b6e1e5222
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:824c97682d0b5180a58b29aad975f1f670351c62a61736d4bcfd4286ecc497ee
 size 4984