Training in progress, epoch 2

Files changed (11) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef12c4c560830a70915ed8990bd15246b45cd4cede20136292a3713df20d7f38
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a7ae91360481ab1aead09d557d58d1b42a726caf7a77a9bf10bee6acbb84e11
 size 267832560

run-0/checkpoint-268/config.json CHANGED Viewed

@@ -20,6 +20,6 @@
   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.38.2",
   "vocab_size": 30522
 }

   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.40.0",
   "vocab_size": 30522
 }

run-0/checkpoint-268/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50b00da9b88c63da26861699eb35b54804a1a5d446a9c579c44ba575cc6e5839
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a7ae91360481ab1aead09d557d58d1b42a726caf7a77a9bf10bee6acbb84e11
 size 267832560

run-0/checkpoint-268/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f3c921fa31b6bf63969ca37245eea6b4fffb137d74dcd041f9c60ccd5e671056
 size 535724410

 version https://git-lfs.github.com/spec/v1
+oid sha256:e36d2c78b2d43a012843b07013247032c4258abd6bff2336658df8ff1338cde8
 size 535724410

run-0/checkpoint-268/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:71a648ba44ab0f8aad220b8a1dd63144a108690234e45a733e0e861c48c570d1
 size 13990

 version https://git-lfs.github.com/spec/v1
+oid sha256:40392f19c38e19bfbfcebe085910b1abec4b89b63722fd76161650b6b9ab4f74
 size 13990

run-0/checkpoint-268/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1586e250c0804dd1701f6acc583b509801d53f57ef9d8d782491154daa9649d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6e9b4c10b2fe900a0592868e9e260872a8150c34e046a0a406aae783984c67e
 size 1064

run-0/checkpoint-268/tokenizer.json CHANGED Viewed

@@ -1,11 +1,6 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 512,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

run-0/checkpoint-268/tokenizer_config.json CHANGED Viewed

@@ -45,7 +45,7 @@
   "cls_token": "[CLS]",
   "do_lower_case": true,
   "mask_token": "[MASK]",
-  "model_max_length": 512,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,

   "cls_token": "[CLS]",
   "do_lower_case": true,
   "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,

run-0/checkpoint-268/trainer_state.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
-  "best_metric": 0.45744157534977586,
-  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-268",
-  "epoch": 1.0,
   "eval_steps": 500,
   "global_step": 268,
   "is_hyper_param_search": true,
@@ -10,26 +10,35 @@
   "log_history": [
     {
       "epoch": 1.0,
-      "eval_loss": 0.4704936742782593,
-      "eval_matthews_correlation": 0.45744157534977586,
-      "eval_runtime": 30.3484,
-      "eval_samples_per_second": 34.367,
-      "eval_steps_per_second": 2.175,
       "step": 268
     }
   ],
   "logging_steps": 500,
-  "max_steps": 536,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
   "total_flos": 0,
-  "train_batch_size": 32,
   "trial_name": null,
   "trial_params": {
-    "learning_rate": 9.01334118373162e-05,
     "num_train_epochs": 2,
-    "per_device_train_batch_size": 32,
-    "seed": 1
   }
 }

 {
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-134",
+  "epoch": 2.0,
   "eval_steps": 500,
   "global_step": 268,
   "is_hyper_param_search": true,
   "log_history": [
     {
       "epoch": 1.0,
+      "eval_loss": 0.5772179365158081,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 28.4405,
+      "eval_samples_per_second": 36.673,
+      "eval_steps_per_second": 2.321,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5522039532661438,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 29.7327,
+      "eval_samples_per_second": 35.079,
+      "eval_steps_per_second": 2.22,
       "step": 268
     }
   ],
   "logging_steps": 500,
+  "max_steps": 268,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
   "total_flos": 0,
+  "train_batch_size": 64,
   "trial_name": null,
   "trial_params": {
+    "learning_rate": 6.016083409160101e-06,
     "num_train_epochs": 2,
+    "per_device_train_batch_size": 64,
+    "seed": 6
   }
 }

run-0/checkpoint-268/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e68dcaeaaa7b85726310fa2d1d977e77e5a2fd412333729b7b500e3b6fc5de5
-size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:de6e654bc5562972689e528d7506196f0ff109bd86fc3e0cc344b82d96435ef0
+size 5048

runs/Apr23_13-58-51_309eb7d6022b/events.out.tfevents.1713886483.309eb7d6022b.9612.2 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5654a81b4d4920d79bc9bf7da087b1dfdff6be20f81dcf8a07763ea82e18138
-size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:3906461454f9b112af0d41fc6222c06cf8da549a78953ab46f65f1cd96bf24e7
+size 5673