Zeid-Hazboun committed on Feb 27

Commit

3b162f6

•

1 Parent(s): b91a83e

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-1/checkpoint-107/config.json +25 -0
run-1/checkpoint-107/model.safetensors +3 -0
run-1/checkpoint-107/optimizer.pt +3 -0
run-1/checkpoint-107/rng_state.pth +3 -0
run-1/checkpoint-107/scheduler.pt +3 -0
run-1/checkpoint-107/special_tokens_map.json +7 -0
run-1/checkpoint-107/tokenizer.json +0 -0
run-1/checkpoint-107/tokenizer_config.json +55 -0
run-1/checkpoint-107/trainer_state.json +35 -0
run-1/checkpoint-107/training_args.bin +3 -0
run-1/checkpoint-107/vocab.txt +0 -0
run-1/checkpoint-214/config.json +25 -0
run-1/checkpoint-214/model.safetensors +3 -0
run-1/checkpoint-214/optimizer.pt +3 -0
run-1/checkpoint-214/rng_state.pth +3 -0
run-1/checkpoint-214/scheduler.pt +3 -0
run-1/checkpoint-214/special_tokens_map.json +7 -0
run-1/checkpoint-214/tokenizer.json +0 -0
run-1/checkpoint-214/tokenizer_config.json +55 -0
run-1/checkpoint-214/trainer_state.json +44 -0
run-1/checkpoint-214/training_args.bin +3 -0
run-1/checkpoint-214/vocab.txt +0 -0
run-1/checkpoint-321/config.json +25 -0
run-1/checkpoint-321/model.safetensors +3 -0
run-1/checkpoint-321/optimizer.pt +3 -0
run-1/checkpoint-321/rng_state.pth +3 -0
run-1/checkpoint-321/scheduler.pt +3 -0
run-1/checkpoint-321/special_tokens_map.json +7 -0
run-1/checkpoint-321/tokenizer.json +0 -0
run-1/checkpoint-321/tokenizer_config.json +55 -0
run-1/checkpoint-321/trainer_state.json +53 -0
run-1/checkpoint-321/training_args.bin +3 -0
run-1/checkpoint-321/vocab.txt +0 -0
run-2/checkpoint-14/config.json +25 -0
run-2/checkpoint-14/model.safetensors +3 -0
run-2/checkpoint-14/optimizer.pt +3 -0
run-2/checkpoint-14/rng_state.pth +3 -0
run-2/checkpoint-14/scheduler.pt +3 -0
run-2/checkpoint-14/special_tokens_map.json +7 -0
run-2/checkpoint-14/tokenizer.json +0 -0
run-2/checkpoint-14/tokenizer_config.json +55 -0
run-2/checkpoint-14/trainer_state.json +35 -0
run-2/checkpoint-14/training_args.bin +3 -0
run-2/checkpoint-14/vocab.txt +0 -0
run-2/checkpoint-28/config.json +25 -0
run-2/checkpoint-28/model.safetensors +3 -0
run-2/checkpoint-28/optimizer.pt +3 -0
run-2/checkpoint-28/rng_state.pth +3 -0
run-2/checkpoint-28/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ca0b1b801c40be6a525b81a9af56db68a1cc672fbfb011a1c7da80ab03f18e9
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:3cad3bec39311015119b7dfa375dc1421ffe9b0de1ad0cbb90bdd9aa8c739653
 size 267832560

run-1/checkpoint-107/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-107/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ca0b1b801c40be6a525b81a9af56db68a1cc672fbfb011a1c7da80ab03f18e9
+size 267832560

run-1/checkpoint-107/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e641822856615d668286a16f3753eb1cac4f5017582a4f968f69726934da5725
+size 535727290

run-1/checkpoint-107/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6909052d85ee621eecfd2de5b2f6c99a2d10ff45d4caefd2624110948becd6f
+size 14244

run-1/checkpoint-107/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b1269a877d3445f5906de1e5c5dbf735b83fd09712508e63aa0618cba3a10a7
+size 1064

run-1/checkpoint-107/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-107/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-107/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-107/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-107",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 107,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6317693591117859,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7452,
+      "eval_samples_per_second": 1399.54,
+      "eval_steps_per_second": 88.561,
+      "step": 107
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 321,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.2269041175221473e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 8,
+    "seed": 36
+  }
+}

run-1/checkpoint-107/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2c771799c3f0c612775b9f3264f31c5777a05f5e58949ae6ad028acb911faaf
+size 4984

run-1/checkpoint-107/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-214/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-214/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:939cc862c6413de1d943a89926f717620b26c299f593388da1e57bdc9074a676
+size 267832560

run-1/checkpoint-214/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e4742abde3e572ac0a6f2067df9d9cc336f0f7eb7796df07c22caf4610175304
+size 535727290

run-1/checkpoint-214/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24b398d61f9a9a70156790ad37f97ebcda7584a5a868a19531fa182c6753c585
+size 14244

run-1/checkpoint-214/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:103da5c6d13650d48bb934a1cdf134b4337d2f761d642dcad0452070a9ba7271
+size 1064

run-1/checkpoint-214/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-214/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-214/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-214/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-107",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 214,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6317693591117859,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7452,
+      "eval_samples_per_second": 1399.54,
+      "eval_steps_per_second": 88.561,
+      "step": 107
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198475360870361,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8043,
+      "eval_samples_per_second": 1296.837,
+      "eval_steps_per_second": 82.063,
+      "step": 214
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 321,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.2269041175221473e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 8,
+    "seed": 36
+  }
+}

run-1/checkpoint-214/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2c771799c3f0c612775b9f3264f31c5777a05f5e58949ae6ad028acb911faaf
+size 4984

run-1/checkpoint-214/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-321/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-321/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb24184aa47d27da3d2e9e618995b04df5672fc47616c4edd0b5290863cb6270
+size 267832560

run-1/checkpoint-321/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:786879dd08f86502d6c80f59e1ad4d8d96b6d2becfb3ee1c868921d95a5b98e4
+size 535727290

run-1/checkpoint-321/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0d05e1e8167080c5a20dc474f203256599f9865345b13ebb967873354e8e56c
+size 14244

run-1/checkpoint-321/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c689f74e6356963e51eb9551234fb917f328a3dc14ccded60406115562531fc
+size 1064

run-1/checkpoint-321/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-321/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-321/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-321/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-107",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 321,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6317693591117859,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7452,
+      "eval_samples_per_second": 1399.54,
+      "eval_steps_per_second": 88.561,
+      "step": 107
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6198475360870361,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8043,
+      "eval_samples_per_second": 1296.837,
+      "eval_steps_per_second": 82.063,
+      "step": 214
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.617213249206543,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.9427,
+      "eval_samples_per_second": 1106.398,
+      "eval_steps_per_second": 70.012,
+      "step": 321
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 321,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.2269041175221473e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 8,
+    "seed": 36
+  }
+}

run-1/checkpoint-321/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2c771799c3f0c612775b9f3264f31c5777a05f5e58949ae6ad028acb911faaf
+size 4984

run-1/checkpoint-321/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-14/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-14/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24ada3fa793f9db4c23b904ce5560855be0251bdc4016965f36e31d3f2079d72
+size 267832560

run-2/checkpoint-14/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3f7114b1b7a3f4027b2598800600d7b37f112b29f207456b980bb02f7f0de0d
+size 535727290

run-2/checkpoint-14/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e330aee525a109f44cc3bc5d4b1387583b6433498f1e92dc092c5b05018b03ae
+size 14244

run-2/checkpoint-14/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ed3c4dbd202897fe743a8d623f80612311872de34c4f38686aef607e2bbee91d
+size 1064

run-2/checkpoint-14/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-14/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-14/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-14/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-14",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 14,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6202465295791626,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7368,
+      "eval_samples_per_second": 1415.551,
+      "eval_steps_per_second": 89.575,
+      "step": 14
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 42,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.681061904439251e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 1
+  }
+}

run-2/checkpoint-14/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:75e134d7e9584622a3d2e97b29681ed84c6eb2036b2a87a8e4a210e17cb4e9f6
+size 4984

run-2/checkpoint-14/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-28/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-28/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9010bd406e02ee3252d394b933c0a4d9cb1cdc96d8c7ae4a7625f3b82027105d
+size 267832560

run-2/checkpoint-28/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b047c792079dfbf989142d8696048e9a01bfed1843754407616fe41fc203f209
+size 535727290

run-2/checkpoint-28/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2c232c4796b2d264b7aad27a5607016ef3f38da67930315a629ac0bcfd95ce6
+size 14244

run-2/checkpoint-28/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d5a00ed5de0b2c6698ee726a3694e42016023a419a49b18d6e91a2cbb6aff8a
+size 1064