rozasajneen committed on Feb 25

Commit

18d915c

•

1 Parent(s): 6f5bd23

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-4/checkpoint-268/config.json +25 -0
run-4/checkpoint-268/model.safetensors +3 -0
run-4/checkpoint-268/optimizer.pt +3 -0
run-4/checkpoint-268/rng_state.pth +3 -0
run-4/checkpoint-268/scheduler.pt +3 -0
run-4/checkpoint-268/special_tokens_map.json +7 -0
run-4/checkpoint-268/tokenizer.json +0 -0
run-4/checkpoint-268/tokenizer_config.json +55 -0
run-4/checkpoint-268/trainer_state.json +44 -0
run-4/checkpoint-268/training_args.bin +3 -0
run-4/checkpoint-268/vocab.txt +0 -0
run-4/checkpoint-402/config.json +25 -0
run-4/checkpoint-402/model.safetensors +3 -0
run-4/checkpoint-402/optimizer.pt +3 -0
run-4/checkpoint-402/rng_state.pth +3 -0
run-4/checkpoint-402/scheduler.pt +3 -0
run-4/checkpoint-402/special_tokens_map.json +7 -0
run-4/checkpoint-402/tokenizer.json +0 -0
run-4/checkpoint-402/tokenizer_config.json +55 -0
run-4/checkpoint-402/trainer_state.json +53 -0
run-4/checkpoint-402/training_args.bin +3 -0
run-4/checkpoint-402/vocab.txt +0 -0
run-4/checkpoint-536/config.json +25 -0
run-4/checkpoint-536/model.safetensors +3 -0
run-4/checkpoint-536/optimizer.pt +3 -0
run-4/checkpoint-536/rng_state.pth +3 -0
run-4/checkpoint-536/scheduler.pt +3 -0
run-4/checkpoint-536/special_tokens_map.json +7 -0
run-4/checkpoint-536/tokenizer.json +0 -0
run-4/checkpoint-536/tokenizer_config.json +55 -0
run-4/checkpoint-536/trainer_state.json +69 -0
run-4/checkpoint-536/training_args.bin +3 -0
run-4/checkpoint-536/vocab.txt +0 -0
run-4/checkpoint-670/config.json +25 -0
run-4/checkpoint-670/model.safetensors +3 -0
run-4/checkpoint-670/optimizer.pt +3 -0
run-4/checkpoint-670/rng_state.pth +3 -0
run-4/checkpoint-670/scheduler.pt +3 -0
run-4/checkpoint-670/special_tokens_map.json +7 -0
run-4/checkpoint-670/tokenizer.json +0 -0
run-4/checkpoint-670/tokenizer_config.json +55 -0
run-4/checkpoint-670/trainer_state.json +78 -0
run-4/checkpoint-670/training_args.bin +3 -0
run-4/checkpoint-670/vocab.txt +0 -0
run-5/checkpoint-535/config.json +25 -0
run-5/checkpoint-535/model.safetensors +3 -0
run-5/checkpoint-535/optimizer.pt +3 -0
run-5/checkpoint-535/rng_state.pth +3 -0
run-5/checkpoint-535/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81dcf56167d3ef493e90dd0b3fbeffe976cc6b878759517a2e9dc2fa7265350b
+oid sha256:8f8faef3b23eaff2c363d74cc3e31d0922f626b504dff2127806023ff5ed2cc6
 size 267832560

run-4/checkpoint-268/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-268/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3383a6abb459361735e834015edbdbc4acd3355935f796907d6f9c71946f4736
+size 267832560

run-4/checkpoint-268/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6dc9ca4c79c6d83c2101ab7c78d89d18d9c73b0fae5309186137fb6e9ba3ceb3
+size 535727290

run-4/checkpoint-268/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3555eb631955363a6f962caf400c4cfa9836ed1849798c8d3679002751fa972
+size 14308

run-4/checkpoint-268/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3311b8b574c75d217575c446a4ad24ffe5ac5d62122c21d187e2affdbc895f16
+size 1064

run-4/checkpoint-268/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-268/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-268/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-268/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.4857615494749571,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-268",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 268,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.4793247580528259,
+      "eval_matthews_correlation": 0.41721186495955986,
+      "eval_runtime": 0.7047,
+      "eval_samples_per_second": 1480.003,
+      "eval_steps_per_second": 93.653,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5243192315101624,
+      "eval_matthews_correlation": 0.4857615494749571,
+      "eval_runtime": 0.7767,
+      "eval_samples_per_second": 1342.919,
+      "eval_steps_per_second": 84.979,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 8.359942777903227e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-4/checkpoint-268/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbe6e3427aa9b8f76859978c9610153c5ea040a7b3849026173b26b4eb6e25c7
+size 4984

run-4/checkpoint-268/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-402/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-402/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0fe00cf0f36f858716e83a6e0010c14f7568f34af5bfdcf8a2539cbf19b8538
+size 267832560

run-4/checkpoint-402/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f29b1d7f3761c2e52bc174d84bd5fa12ae45ddcc7c90546cd5847d64205fa1a
+size 535727290

run-4/checkpoint-402/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcd6b7a38a6047632ee5ad39fcd32f4e17ab531a71382eea1de3c665cd385337
+size 14308

run-4/checkpoint-402/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f9674863f352a64a8d6e447b12472ef2193881c5f94ccd249745d33c675cad98
+size 1064

run-4/checkpoint-402/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-402/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-402/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-402/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.5127204235005072,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-402",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 402,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.4793247580528259,
+      "eval_matthews_correlation": 0.41721186495955986,
+      "eval_runtime": 0.7047,
+      "eval_samples_per_second": 1480.003,
+      "eval_steps_per_second": 93.653,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5243192315101624,
+      "eval_matthews_correlation": 0.4857615494749571,
+      "eval_runtime": 0.7767,
+      "eval_samples_per_second": 1342.919,
+      "eval_steps_per_second": 84.979,
+      "step": 268
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6017581224441528,
+      "eval_matthews_correlation": 0.5127204235005072,
+      "eval_runtime": 0.7858,
+      "eval_samples_per_second": 1327.328,
+      "eval_steps_per_second": 83.992,
+      "step": 402
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 8.359942777903227e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-4/checkpoint-402/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbe6e3427aa9b8f76859978c9610153c5ea040a7b3849026173b26b4eb6e25c7
+size 4984

run-4/checkpoint-402/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-536/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-536/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da46f7ffbafb86b684fdab60d5ebd77f310ee0f9b88e243454405a1cda6fe856
+size 267832560

run-4/checkpoint-536/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a2d067d324bef3581640d650090bee93348b4db18b3724f47240e15bc783d02
+size 535727290

run-4/checkpoint-536/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d82bf028df2c2e35df0c6c234b9740a0803dfc7005ef2834a500e80e05038eba
+size 14308

run-4/checkpoint-536/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94c8708b3b904da2a14c40f19b022bce13e54bb615c87806b07ba2c36287b911
+size 1064

run-4/checkpoint-536/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-536/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-536/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-536/trainer_state.json ADDED Viewed

	@@ -0,0 +1,69 @@

+{
+  "best_metric": 0.516230230689141,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-536",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 536,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.4793247580528259,
+      "eval_matthews_correlation": 0.41721186495955986,
+      "eval_runtime": 0.7047,
+      "eval_samples_per_second": 1480.003,
+      "eval_steps_per_second": 93.653,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5243192315101624,
+      "eval_matthews_correlation": 0.4857615494749571,
+      "eval_runtime": 0.7767,
+      "eval_samples_per_second": 1342.919,
+      "eval_steps_per_second": 84.979,
+      "step": 268
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6017581224441528,
+      "eval_matthews_correlation": 0.5127204235005072,
+      "eval_runtime": 0.7858,
+      "eval_samples_per_second": 1327.328,
+      "eval_steps_per_second": 83.992,
+      "step": 402
+    },
+    {
+      "epoch": 3.73,
+      "grad_norm": 3.175116539001465,
+      "learning_rate": 2.121179510811267e-05,
+      "loss": 0.2876,
+      "step": 500
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.7295573949813843,
+      "eval_matthews_correlation": 0.516230230689141,
+      "eval_runtime": 0.7821,
+      "eval_samples_per_second": 1333.555,
+      "eval_steps_per_second": 84.386,
+      "step": 536
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 210826263292620.0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 8.359942777903227e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-4/checkpoint-536/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbe6e3427aa9b8f76859978c9610153c5ea040a7b3849026173b26b4eb6e25c7
+size 4984

run-4/checkpoint-536/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-670/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-670/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4f236e7bc07911b0202d2a0c9d8b33a102289900d88a1fffd24d6f8a4da5fb74
+size 267832560

run-4/checkpoint-670/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1eea31cd40114c629fd466b9e5185aff0448f319c7202f0c7468edc9eb499841
+size 535727290

run-4/checkpoint-670/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5d032dd752baa9b40c95529b665302cb6ab7131fc6cc6430740e5c15081dc53
+size 14308

run-4/checkpoint-670/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4860180558576ebcfce8a1c9beb42b868dcec43ca037264331469fdb32eeaf44
+size 1064

run-4/checkpoint-670/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-670/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-670/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-670/trainer_state.json ADDED Viewed

	@@ -0,0 +1,78 @@

+{
+  "best_metric": 0.5282404248888111,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-670",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 670,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.4793247580528259,
+      "eval_matthews_correlation": 0.41721186495955986,
+      "eval_runtime": 0.7047,
+      "eval_samples_per_second": 1480.003,
+      "eval_steps_per_second": 93.653,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5243192315101624,
+      "eval_matthews_correlation": 0.4857615494749571,
+      "eval_runtime": 0.7767,
+      "eval_samples_per_second": 1342.919,
+      "eval_steps_per_second": 84.979,
+      "step": 268
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6017581224441528,
+      "eval_matthews_correlation": 0.5127204235005072,
+      "eval_runtime": 0.7858,
+      "eval_samples_per_second": 1327.328,
+      "eval_steps_per_second": 83.992,
+      "step": 402
+    },
+    {
+      "epoch": 3.73,
+      "grad_norm": 3.175116539001465,
+      "learning_rate": 2.121179510811267e-05,
+      "loss": 0.2876,
+      "step": 500
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.7295573949813843,
+      "eval_matthews_correlation": 0.516230230689141,
+      "eval_runtime": 0.7821,
+      "eval_samples_per_second": 1333.555,
+      "eval_steps_per_second": 84.386,
+      "step": 536
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.8349049687385559,
+      "eval_matthews_correlation": 0.5282404248888111,
+      "eval_runtime": 1.5,
+      "eval_samples_per_second": 695.316,
+      "eval_steps_per_second": 43.999,
+      "step": 670
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 210826263292620.0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 8.359942777903227e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-4/checkpoint-670/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbe6e3427aa9b8f76859978c9610153c5ea040a7b3849026173b26b4eb6e25c7
+size 4984

run-4/checkpoint-670/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-5/checkpoint-535/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-5/checkpoint-535/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f8faef3b23eaff2c363d74cc3e31d0922f626b504dff2127806023ff5ed2cc6
+size 267832560

run-5/checkpoint-535/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:78d1b067cce2a432c584e3c217b5ac5359b5c9b05f44e0cd28547dd5347db19f
+size 535727290

run-5/checkpoint-535/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcab177d8880a047d5457ee3cb55b6fe077e5fc14e2c24f62896c955493aabb5
+size 14244

run-5/checkpoint-535/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:098d5d650c71f7ffc85040cf920d0791c5a5ae306b5e675f61bb6cca1d8ddea2
+size 1064