anamelchor committed on Feb 27, 2024

Commit

aaa50b7

verified ·

1 Parent(s): 5f4d427

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-3/checkpoint-28/config.json +25 -0
run-3/checkpoint-28/model.safetensors +3 -0
run-3/checkpoint-28/optimizer.pt +3 -0
run-3/checkpoint-28/rng_state.pth +3 -0
run-3/checkpoint-28/scheduler.pt +3 -0
run-3/checkpoint-28/special_tokens_map.json +7 -0
run-3/checkpoint-28/tokenizer.json +0 -0
run-3/checkpoint-28/tokenizer_config.json +55 -0
run-3/checkpoint-28/trainer_state.json +44 -0
run-3/checkpoint-28/training_args.bin +3 -0
run-3/checkpoint-28/vocab.txt +0 -0
run-3/checkpoint-42/config.json +25 -0
run-3/checkpoint-42/model.safetensors +3 -0
run-3/checkpoint-42/optimizer.pt +3 -0
run-3/checkpoint-42/rng_state.pth +3 -0
run-3/checkpoint-42/scheduler.pt +3 -0
run-3/checkpoint-42/special_tokens_map.json +7 -0
run-3/checkpoint-42/tokenizer.json +0 -0
run-3/checkpoint-42/tokenizer_config.json +55 -0
run-3/checkpoint-42/trainer_state.json +53 -0
run-3/checkpoint-42/training_args.bin +3 -0
run-3/checkpoint-42/vocab.txt +0 -0
run-3/checkpoint-56/config.json +25 -0
run-3/checkpoint-56/model.safetensors +3 -0
run-3/checkpoint-56/optimizer.pt +3 -0
run-3/checkpoint-56/rng_state.pth +3 -0
run-3/checkpoint-56/scheduler.pt +3 -0
run-3/checkpoint-56/special_tokens_map.json +7 -0
run-3/checkpoint-56/tokenizer.json +0 -0
run-3/checkpoint-56/tokenizer_config.json +55 -0
run-3/checkpoint-56/trainer_state.json +62 -0
run-3/checkpoint-56/training_args.bin +3 -0
run-3/checkpoint-56/vocab.txt +0 -0
run-3/checkpoint-70/config.json +25 -0
run-3/checkpoint-70/model.safetensors +3 -0
run-3/checkpoint-70/optimizer.pt +3 -0
run-3/checkpoint-70/rng_state.pth +3 -0
run-3/checkpoint-70/scheduler.pt +3 -0
run-3/checkpoint-70/special_tokens_map.json +7 -0
run-3/checkpoint-70/tokenizer.json +0 -0
run-3/checkpoint-70/tokenizer_config.json +55 -0
run-3/checkpoint-70/trainer_state.json +71 -0
run-3/checkpoint-70/training_args.bin +3 -0
run-3/checkpoint-70/vocab.txt +0 -0
run-4/checkpoint-214/config.json +25 -0
run-4/checkpoint-214/model.safetensors +3 -0
run-4/checkpoint-214/optimizer.pt +3 -0
run-4/checkpoint-214/rng_state.pth +3 -0
run-4/checkpoint-214/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:efd2beb68dea772533b2d8bb10a96dd3c7b1ed66f4471c947aed0e9bedec29f3
+oid sha256:79865c33c7bf98d3964f5869bc9be96a1a7692de8cbdd2aba029b7fbe1cb6e07
 size 267832560

run-3/checkpoint-28/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-3/checkpoint-28/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a4c23f7593eb4934b1164309772de95ca6b6d7831f4291286a630e4ff1078f84
+size 267832560

run-3/checkpoint-28/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b0c49b19b4b61ccaf2b97c89f7b18aa2a818d5976237066f6e621172928b708
+size 535727290

run-3/checkpoint-28/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5197778b13fdd3d29d0d2bd5a3963b7496971abf30b91e7dc44d73ee41788c0
+size 14308

run-3/checkpoint-28/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e710cde757771fefd84a011ec5c32f0d9b86fd935c81b60d9d6f22717a891d5
+size 1064

run-3/checkpoint-28/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-28/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-28/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-28/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-14",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 28,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6366313099861145,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7373,
+      "eval_samples_per_second": 1414.699,
+      "eval_steps_per_second": 89.521,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198997497558594,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.0022,
+      "eval_samples_per_second": 1040.684,
+      "eval_steps_per_second": 65.853,
+      "step": 28
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 70,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.334111722797918e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 26
+  }
+}

run-3/checkpoint-28/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84cda071733079cd7a9b47f4f85a0441647707f07c937e25d524e4ed794651e0
+size 4984

run-3/checkpoint-28/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-42/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-3/checkpoint-42/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7549dd30d2e0a2c0a9913416641ecaea266302013e81e0181173034b06937379
+size 267832560

run-3/checkpoint-42/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96c6e8b22f3072e365398a65943954476ff44270d55c68ef439c1b591734632c
+size 535727290

run-3/checkpoint-42/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8aee0423b713ff809894b32709ebeb6f8710ef6f4c28e9ad365ac10810557ea8
+size 14308

run-3/checkpoint-42/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:380a42d523b328eeb1b25d754840084cf24eb63d32a870a268852280598150c8
+size 1064

run-3/checkpoint-42/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-42/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-42/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-42/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-14",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 42,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6366313099861145,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7373,
+      "eval_samples_per_second": 1414.699,
+      "eval_steps_per_second": 89.521,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198997497558594,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.0022,
+      "eval_samples_per_second": 1040.684,
+      "eval_steps_per_second": 65.853,
+      "step": 28
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6155935525894165,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8197,
+      "eval_samples_per_second": 1272.398,
+      "eval_steps_per_second": 80.516,
+      "step": 42
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 70,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.334111722797918e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 26
+  }
+}

run-3/checkpoint-42/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84cda071733079cd7a9b47f4f85a0441647707f07c937e25d524e4ed794651e0
+size 4984

run-3/checkpoint-42/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-56/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-3/checkpoint-56/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd9a1d9cbf6cefce58555b0aa62d8e91637c69c3fc35e0fa4fe439fc319218d4
+size 267832560

run-3/checkpoint-56/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:902167f289883e9fd9938667f1d91e586d3888c295d24d60945cd70ef44cc5f4
+size 535727290

run-3/checkpoint-56/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:750f694db3d10a6c5fed7d99f05860add502bab90dc60863cc62f7998f1feece
+size 14308

run-3/checkpoint-56/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c276c379069e6d4ac21c21f6e3859d4daa8334876bed7a7b71044dae954a1c7a
+size 1064

run-3/checkpoint-56/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-56/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-56/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-56/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-14",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 56,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6366313099861145,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7373,
+      "eval_samples_per_second": 1414.699,
+      "eval_steps_per_second": 89.521,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198997497558594,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.0022,
+      "eval_samples_per_second": 1040.684,
+      "eval_steps_per_second": 65.853,
+      "step": 28
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6155935525894165,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8197,
+      "eval_samples_per_second": 1272.398,
+      "eval_steps_per_second": 80.516,
+      "step": 42
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6139842867851257,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.3039,
+      "eval_samples_per_second": 799.914,
+      "eval_steps_per_second": 50.618,
+      "step": 56
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 70,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.334111722797918e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 26
+  }
+}

run-3/checkpoint-56/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84cda071733079cd7a9b47f4f85a0441647707f07c937e25d524e4ed794651e0
+size 4984

run-3/checkpoint-56/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-70/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-3/checkpoint-70/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5bb5ac8b6a225ce78056ab9aa184b2154c52d6e41f9a85cb66791f115ec72808
+size 267832560

run-3/checkpoint-70/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:517192997b8d61063ee18d074f75c32cb609d1d3999582931831a2eb3fe1c499
+size 535727290

run-3/checkpoint-70/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23213bbe82e85687c90ba47be5f41fb4d68f40a5101140cb33703aa57880ba62
+size 14308

run-3/checkpoint-70/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aa0dc4d9dc14db9e1e9ef54adb977fc723cff0aa8e8f652c47ae7bd18628f173
+size 1064

run-3/checkpoint-70/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-70/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-70/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-70/trainer_state.json ADDED Viewed

	@@ -0,0 +1,71 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-14",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 70,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6366313099861145,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7373,
+      "eval_samples_per_second": 1414.699,
+      "eval_steps_per_second": 89.521,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198997497558594,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.0022,
+      "eval_samples_per_second": 1040.684,
+      "eval_steps_per_second": 65.853,
+      "step": 28
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6155935525894165,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8197,
+      "eval_samples_per_second": 1272.398,
+      "eval_steps_per_second": 80.516,
+      "step": 42
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6139842867851257,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.3039,
+      "eval_samples_per_second": 799.914,
+      "eval_steps_per_second": 50.618,
+      "step": 56
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.6134741902351379,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7992,
+      "eval_samples_per_second": 1305.091,
+      "eval_steps_per_second": 82.585,
+      "step": 70
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 70,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.334111722797918e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 26
+  }
+}

run-3/checkpoint-70/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84cda071733079cd7a9b47f4f85a0441647707f07c937e25d524e4ed794651e0
+size 4984

run-3/checkpoint-70/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-214/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-214/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:79865c33c7bf98d3964f5869bc9be96a1a7692de8cbdd2aba029b7fbe1cb6e07
+size 267832560

run-4/checkpoint-214/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff1ea5ded670af376725e114d16f1ae0b69b4a53bca2151723eb440dfddaa3e5
+size 535727290

run-4/checkpoint-214/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0393392c4b01959d556c154618c731ff987a15e47201ae9d681c00e65e98ae7c
+size 14244

run-4/checkpoint-214/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e83c989bc9c0e6b812550c6b94b7801888f834a9423e8e8eb9f846c2d59f526d
+size 1064