azliza794 committed on Oct 2, 2024

Commit

5cee664

verified ·

1 Parent(s): 39ec58a

Training in progress, epoch 1

Browse files

Files changed (48) hide show

model.safetensors +1 -1
run-8/checkpoint-402/config.json +25 -0
run-8/checkpoint-402/model.safetensors +3 -0
run-8/checkpoint-402/optimizer.pt +3 -0
run-8/checkpoint-402/rng_state.pth +3 -0
run-8/checkpoint-402/scheduler.pt +3 -0
run-8/checkpoint-402/special_tokens_map.json +7 -0
run-8/checkpoint-402/tokenizer.json +0 -0
run-8/checkpoint-402/tokenizer_config.json +55 -0
run-8/checkpoint-402/trainer_state.json +56 -0
run-8/checkpoint-402/training_args.bin +3 -0
run-8/checkpoint-402/vocab.txt +0 -0
run-9/checkpoint-134/config.json +25 -0
run-9/checkpoint-134/model.safetensors +3 -0
run-9/checkpoint-134/optimizer.pt +3 -0
run-9/checkpoint-134/rng_state.pth +3 -0
run-9/checkpoint-134/scheduler.pt +3 -0
run-9/checkpoint-134/special_tokens_map.json +7 -0
run-9/checkpoint-134/tokenizer.json +0 -0
run-9/checkpoint-134/tokenizer_config.json +55 -0
run-9/checkpoint-134/trainer_state.json +47 -0
run-9/checkpoint-134/training_args.bin +3 -0
run-9/checkpoint-134/vocab.txt +0 -0
run-9/checkpoint-268/config.json +25 -0
run-9/checkpoint-268/model.safetensors +3 -0
run-9/checkpoint-268/optimizer.pt +3 -0
run-9/checkpoint-268/rng_state.pth +3 -0
run-9/checkpoint-268/scheduler.pt +3 -0
run-9/checkpoint-268/special_tokens_map.json +7 -0
run-9/checkpoint-268/tokenizer.json +0 -0
run-9/checkpoint-268/tokenizer_config.json +55 -0
run-9/checkpoint-268/trainer_state.json +56 -0
run-9/checkpoint-268/training_args.bin +3 -0
run-9/checkpoint-268/vocab.txt +0 -0
run-9/checkpoint-402/config.json +25 -0
run-9/checkpoint-402/model.safetensors +3 -0
run-9/checkpoint-402/optimizer.pt +3 -0
run-9/checkpoint-402/rng_state.pth +3 -0
run-9/checkpoint-402/scheduler.pt +3 -0
run-9/checkpoint-402/special_tokens_map.json +7 -0
run-9/checkpoint-402/tokenizer.json +0 -0
run-9/checkpoint-402/tokenizer_config.json +55 -0
run-9/checkpoint-402/trainer_state.json +56 -0
run-9/checkpoint-402/training_args.bin +3 -0
run-9/checkpoint-402/vocab.txt +0 -0
runs/Oct02_05-18-55_0fd1839bafe2/events.out.tfevents.1727849344.0fd1839bafe2.228.11 +3 -0
runs/Oct02_05-18-55_0fd1839bafe2/events.out.tfevents.1727849716.0fd1839bafe2.228.12 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:433dbd856696ab5af5f01b46b96262dee0ca5aee252df96b0354eeafa9a8fee5
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:37b4ebc6ca65f593e216669994f47a9363ce75bc9f71073bffb3783be94bb86c
 size 267832560

run-8/checkpoint-402/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.45.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-402/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0bb6def054d4a1c0e84bebcb2de5c7d760ffb5cb4dbedd0a5002854c20eb575f
+size 267832560

run-8/checkpoint-402/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c69e2867480bb95fddb19c7d17e1603f0bf80477d7052d525ad0558d16c67f38
+size 535727290

run-8/checkpoint-402/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc48165f96c95e93b770dbf5148fdd3a5a339128077c8062b3cbab3af12210ce
+size 14308

run-8/checkpoint-402/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77300bf1b104feeccda463fc8d3179b8db10406d99745b631fcc47677c65b50d
+size 1064

run-8/checkpoint-402/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-402/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-402/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-402/trainer_state.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "best_metric": 0.4460777593165835,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-268",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 402,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5172421336174011,
+      "eval_matthews_correlation": 0.3620451783618902,
+      "eval_runtime": 0.8669,
+      "eval_samples_per_second": 1203.157,
+      "eval_steps_per_second": 76.135,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.4833631217479706,
+      "eval_matthews_correlation": 0.4460777593165835,
+      "eval_runtime": 0.7326,
+      "eval_samples_per_second": 1423.789,
+      "eval_steps_per_second": 90.096,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 402,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 7.667924170849842e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 31
+  }
+}

run-8/checkpoint-402/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e62a7389f77de5be444c3f8215f73607c1df8e9ffb6e699c83dce559c0a17abc
+size 5304

run-8/checkpoint-402/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-134/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.45.1",
+  "vocab_size": 30522
+}

run-9/checkpoint-134/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8520642316417afcd56fa5e0240eeff5d606cdcb022d2448fd1f1e236eded324
+size 267832560

run-9/checkpoint-134/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:758fe1a14a02d8597d99e00b0093bd58907fa86012113b42bd673594b13f3abe
+size 535727290

run-9/checkpoint-134/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88e5ee3b68711c6eef1395eff91faa3ca1316962bb36b4e6e5e949e875db7153
+size 14244

run-9/checkpoint-134/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1097b1cebb1a5260c2121747029e8224d0ef1bf775cf00bc6ab990a02a928d28
+size 1064

run-9/checkpoint-134/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-134/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-134/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-134/trainer_state.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "best_metric": 0.3822545955758537,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-9/checkpoint-134",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 134,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5341776013374329,
+      "eval_matthews_correlation": 0.3822545955758537,
+      "eval_runtime": 0.8953,
+      "eval_samples_per_second": 1164.93,
+      "eval_steps_per_second": 73.716,
+      "step": 134
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 402,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.7092657771935757e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 3
+  }
+}

run-9/checkpoint-134/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d559ab9ea359d9c7451385758a914c6a7bf2aa72f17ac557fb59939b00e8404
+size 5304

run-9/checkpoint-134/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-268/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.45.1",
+  "vocab_size": 30522
+}

run-9/checkpoint-268/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:120abed89f7ed43062156f57b65a4fb864c0c56e4d0b9d2bc4a5901b20b92c9f
+size 267832560

run-9/checkpoint-268/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66d5eeabfe9a9a9913d12900fae0ce75129791761c379370a72571f2caa95e4a
+size 535727290

run-9/checkpoint-268/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a71d2a8aa30cd6a3948bc1ce49f6cec4f98911a38087f54d74a4721d266cccb1
+size 14244

run-9/checkpoint-268/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c8e20ba0589c6b7921e201a0384356f7ed2be105bc5b8ae994cd354dd2c9334
+size 1064

run-9/checkpoint-268/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-268/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-268/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-268/trainer_state.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "best_metric": 0.4411030676126281,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-9/checkpoint-268",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 268,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5341776013374329,
+      "eval_matthews_correlation": 0.3822545955758537,
+      "eval_runtime": 0.8953,
+      "eval_samples_per_second": 1164.93,
+      "eval_steps_per_second": 73.716,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5112224221229553,
+      "eval_matthews_correlation": 0.4411030676126281,
+      "eval_runtime": 0.83,
+      "eval_samples_per_second": 1256.671,
+      "eval_steps_per_second": 79.521,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 402,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.7092657771935757e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 3
+  }
+}

run-9/checkpoint-268/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d559ab9ea359d9c7451385758a914c6a7bf2aa72f17ac557fb59939b00e8404
+size 5304

run-9/checkpoint-268/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-402/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.45.1",
+  "vocab_size": 30522
+}

run-9/checkpoint-402/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da528bf64d937f12f4322f9b066de1e550074e3bfb9efecc00910c65ccd3b00f
+size 267832560

run-9/checkpoint-402/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:312bd3b6a54716469aa9fbbccb57e521f47086d90d1400a1d40375d4c1ebc0d0
+size 535727290

run-9/checkpoint-402/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be5217733de84a5068ad82abb6a0d40288cb7a2205bf7835f2608eebf21ae9ed
+size 14244

run-9/checkpoint-402/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:edf35d2a4fa0e0cf004a3df8552420a503ce8162631bc842b51a31e8f8286afc
+size 1064

run-9/checkpoint-402/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-402/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-402/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-402/trainer_state.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "best_metric": 0.4411030676126281,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-9/checkpoint-268",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 402,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5341776013374329,
+      "eval_matthews_correlation": 0.3822545955758537,
+      "eval_runtime": 0.8953,
+      "eval_samples_per_second": 1164.93,
+      "eval_steps_per_second": 73.716,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5112224221229553,
+      "eval_matthews_correlation": 0.4411030676126281,
+      "eval_runtime": 0.83,
+      "eval_samples_per_second": 1256.671,
+      "eval_steps_per_second": 79.521,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 402,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.7092657771935757e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 3
+  }
+}

run-9/checkpoint-402/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d559ab9ea359d9c7451385758a914c6a7bf2aa72f17ac557fb59939b00e8404
+size 5304

run-9/checkpoint-402/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Oct02_05-18-55_0fd1839bafe2/events.out.tfevents.1727849344.0fd1839bafe2.228.11 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:65742650e4e37b21b1431d1a00668f7c95953175572e2c95b5758ca6fda1c685
+size 5931

runs/Oct02_05-18-55_0fd1839bafe2/events.out.tfevents.1727849716.0fd1839bafe2.228.12 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32638ef521f4c7465a432732f6bc766023c48b8e989e56683e6f1e29e81d9006
+size 8307

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e62a7389f77de5be444c3f8215f73607c1df8e9ffb6e699c83dce559c0a17abc
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:3becf80cdc9221d5701481d18740c6b71586a42ea3a6944468cdacaf47dd2b83
 size 5304