SjardiWillems committed on Mar 5, 2024

Commit

b968bcd

verified ·

1 Parent(s): d53c5c8

Training in progress, epoch 1

Browse files

Files changed (47) hide show

model.safetensors +1 -1
run-4/checkpoint-108/config.json +25 -0
run-4/checkpoint-108/model.safetensors +3 -0
run-4/checkpoint-108/optimizer.pt +3 -0
run-4/checkpoint-108/rng_state.pth +3 -0
run-4/checkpoint-108/scheduler.pt +3 -0
run-4/checkpoint-108/special_tokens_map.json +7 -0
run-4/checkpoint-108/tokenizer.json +0 -0
run-4/checkpoint-108/tokenizer_config.json +55 -0
run-4/checkpoint-108/trainer_state.json +44 -0
run-4/checkpoint-108/training_args.bin +3 -0
run-4/checkpoint-108/vocab.txt +0 -0
run-4/checkpoint-162/config.json +25 -0
run-4/checkpoint-162/model.safetensors +3 -0
run-4/checkpoint-162/optimizer.pt +3 -0
run-4/checkpoint-162/rng_state.pth +3 -0
run-4/checkpoint-162/scheduler.pt +3 -0
run-4/checkpoint-162/special_tokens_map.json +7 -0
run-4/checkpoint-162/tokenizer.json +0 -0
run-4/checkpoint-162/tokenizer_config.json +55 -0
run-4/checkpoint-162/trainer_state.json +53 -0
run-4/checkpoint-162/training_args.bin +3 -0
run-4/checkpoint-162/vocab.txt +0 -0
run-4/checkpoint-216/config.json +25 -0
run-4/checkpoint-216/model.safetensors +3 -0
run-4/checkpoint-216/optimizer.pt +3 -0
run-4/checkpoint-216/rng_state.pth +3 -0
run-4/checkpoint-216/scheduler.pt +3 -0
run-4/checkpoint-216/special_tokens_map.json +7 -0
run-4/checkpoint-216/tokenizer.json +0 -0
run-4/checkpoint-216/tokenizer_config.json +55 -0
run-4/checkpoint-216/trainer_state.json +62 -0
run-4/checkpoint-216/training_args.bin +3 -0
run-4/checkpoint-216/vocab.txt +0 -0
run-5/checkpoint-107/config.json +25 -0
run-5/checkpoint-107/model.safetensors +3 -0
run-5/checkpoint-107/optimizer.pt +3 -0
run-5/checkpoint-107/rng_state.pth +3 -0
run-5/checkpoint-107/scheduler.pt +3 -0
run-5/checkpoint-107/special_tokens_map.json +7 -0
run-5/checkpoint-107/tokenizer.json +0 -0
run-5/checkpoint-107/tokenizer_config.json +55 -0
run-5/checkpoint-107/trainer_state.json +35 -0
run-5/checkpoint-107/training_args.bin +3 -0
run-5/checkpoint-107/vocab.txt +0 -0
runs/Mar05_22-12-34_418b5b5ae03a/events.out.tfevents.1709677185.418b5b5ae03a.490.7 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02862714de993ef37f27e3368f59c2a27353cbade9b451ae7a7827c2a8b05f06
+oid sha256:5405b3f0bc690acb5e72d8572bb2ab62892d313bbd5164d479dc89393c90522c
 size 267832560

run-4/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-4/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b32b2098f1978fae096499d0e4ea75993971c8cb014709e9800eed76243f85f7
+size 267832560

run-4/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d274d7de9fc8010463014c6fbe9d9bd09e89cea678ab2df7c54c6c79da225d26
+size 535727290

run-4/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee7e60f79ad03e7883c079c1f85495a981d3be8767293cdfbe55f08a3528f0ec
+size 14244

run-4/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc496dec6453ccf31569df2947b352c5714d0b8b9fbaf79982d848df2dbccbdb
+size 1064

run-4/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-54",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6176753640174866,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4943,
+      "eval_samples_per_second": 2110.017,
+      "eval_steps_per_second": 133.52,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6119449734687805,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4986,
+      "eval_samples_per_second": 2091.885,
+      "eval_steps_per_second": 132.372,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.417181244756343e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 16,
+    "seed": 2
+  }
+}

run-4/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3928c16c02505fbafd2b613f04e198971dff973ed26c136be7ae0be8c95ef703
+size 4984

run-4/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-162/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-4/checkpoint-162/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:079f17b5f388b8cea96e25ae7ad797174210fe8e467dcf40882e5deb4ec752c0
+size 267832560

run-4/checkpoint-162/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ca0eff644d08b148a1be55952038d61186dc2405d3faa86ae85f475046d19f5
+size 535727290

run-4/checkpoint-162/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3065039ef3f12043ba4ac718f8e8557de93e86115ec7539c965ca687dfb38259
+size 14244

run-4/checkpoint-162/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8a1402a31c31d75a4ff4384b2387d50a1ae106a25bb9c93324f9295254d3df9
+size 1064

run-4/checkpoint-162/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-162/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-162/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-162/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-54",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 162,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6176753640174866,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4943,
+      "eval_samples_per_second": 2110.017,
+      "eval_steps_per_second": 133.52,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6119449734687805,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4986,
+      "eval_samples_per_second": 2091.885,
+      "eval_steps_per_second": 132.372,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.608396589756012,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5,
+      "eval_samples_per_second": 2086.175,
+      "eval_steps_per_second": 132.011,
+      "step": 162
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.417181244756343e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 16,
+    "seed": 2
+  }
+}

run-4/checkpoint-162/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3928c16c02505fbafd2b613f04e198971dff973ed26c136be7ae0be8c95ef703
+size 4984

run-4/checkpoint-162/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-216/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-4/checkpoint-216/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45c1554230c4ba82af03c693a04a02f95d9a79d7399b8b8a728025a28a654e6a
+size 267832560

run-4/checkpoint-216/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d96836243d4e100d0b913df19ea2a58b924fc420eb831d1fc13077967e85263d
+size 535727290

run-4/checkpoint-216/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:549efac80955166702d656a376df45a74f203f1f0a38fdbc0f5e0a62c71685a0
+size 14244

run-4/checkpoint-216/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d46a262ce8a845e8459adfc789b16b04777aeb4b7a62a122800e6594ef2670a8
+size 1064

run-4/checkpoint-216/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-216/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-216/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-216/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-54",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 216,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6176753640174866,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4943,
+      "eval_samples_per_second": 2110.017,
+      "eval_steps_per_second": 133.52,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6119449734687805,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4986,
+      "eval_samples_per_second": 2091.885,
+      "eval_steps_per_second": 132.372,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.608396589756012,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.5,
+      "eval_samples_per_second": 2086.175,
+      "eval_steps_per_second": 132.011,
+      "step": 162
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6073262691497803,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4975,
+      "eval_samples_per_second": 2096.331,
+      "eval_steps_per_second": 132.654,
+      "step": 216
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.417181244756343e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 16,
+    "seed": 2
+  }
+}

run-4/checkpoint-216/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3928c16c02505fbafd2b613f04e198971dff973ed26c136be7ae0be8c95ef703
+size 4984

run-4/checkpoint-216/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-5/checkpoint-107/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "vocab_size": 30522
+}

run-5/checkpoint-107/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5405b3f0bc690acb5e72d8572bb2ab62892d313bbd5164d479dc89393c90522c
+size 267832560

run-5/checkpoint-107/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f189c01a54c688d37fb6a62212d52f2baaa3da35bf1525b2e4b77398850c05df
+size 535727290

run-5/checkpoint-107/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15704b81217fbb058fc44280ba7055ee6fb9d4b79ec4940ec066d50c4134ceb6
+size 14244

run-5/checkpoint-107/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:75575dabb9dd2635675316e2564ba84f4817325682d84b02a8b5870800c2a215
+size 1064

run-5/checkpoint-107/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-107/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-5/checkpoint-107/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-107/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-5/checkpoint-107",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 107,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5872147679328918,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.4953,
+      "eval_samples_per_second": 2105.738,
+      "eval_steps_per_second": 133.249,
+      "step": 107
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 428,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.3532603647862407e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 8,
+    "seed": 39
+  }
+}

run-5/checkpoint-107/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8bbb62e7b6ea76b58f3ba9c9316f93ea5221fba36315ac9f237a40d72a4bfca
+size 4984

run-5/checkpoint-107/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Mar05_22-12-34_418b5b5ae03a/events.out.tfevents.1709677185.418b5b5ae03a.490.7 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:771a40b73ebc5375b186dbbd5f2c09908cb451d6209bc0219bba55b8fb1a10d3
+size 6230

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3928c16c02505fbafd2b613f04e198971dff973ed26c136be7ae0be8c95ef703
+oid sha256:e8bbb62e7b6ea76b58f3ba9c9316f93ea5221fba36315ac9f237a40d72a4bfca
 size 4984